[ { "page_no": 0, "size": { "width": 612.0, "height": 792.0 }, "parsed_page": { "dimension": { "angle": 0.0, "rect": { "r_x0": 0.0, "r_y0": 0.0, "r_x1": 612.0, "r_y1": 0.0, "r_x2": 612.0, "r_y2": 792.0, "r_x3": 0.0, "r_y3": 792.0, "coord_origin": "BOTTOMLEFT" }, "boundary_type": "crop_box", "art_bbox": { "l": 0.0, "t": 792.0, "r": 612.0, "b": 0.0, "coord_origin": "BOTTOMLEFT" }, "bleed_bbox": { "l": 0.0, "t": 792.0, "r": 612.0, "b": 0.0, "coord_origin": "BOTTOMLEFT" }, "crop_bbox": { "l": 0.0, "t": 792.0, "r": 612.0, "b": 0.0, "coord_origin": "BOTTOMLEFT" }, "media_bbox": { "l": 0.0, "t": 792.0, "r": 612.0, "b": 0.0, "coord_origin": "BOTTOMLEFT" }, "trim_bbox": { "l": 0.0, "t": 792.0, "r": 612.0, "b": 0.0, "coord_origin": "BOTTOMLEFT" } }, "bitmap_resources": [], "char_cells": [], "word_cells": [], "textline_cells": [ { "index": 0, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 134.8, "r_y0": 128.6, "r_x1": 480.6, "r_y1": 128.6, "r_x2": 480.6, "r_y2": 115.9, "r_x3": 134.8, "r_y3": 115.9, "coord_origin": "TOPLEFT" }, "text": "Optimized Table Tokenization for Table Structure", "orig": "Optimized Table Tokenization for Table Structure", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 1, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 266.7, "r_y0": 146.5, "r_x1": 348.7, "r_y1": 146.5, "r_x2": 348.7, "r_y2": 133.8, "r_x3": 266.7, "r_y3": 133.8, "coord_origin": "TOPLEFT" }, "text": "Recognition", "orig": "Recognition", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 2, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 151.2, "r_y0": 180.5, "r_x1": 217.0, "r_y1": 180.5, "r_x2": 217.0, "r_y2": 171.7, "r_x3": 151.2, "r_y3": 171.7, "coord_origin": "TOPLEFT" }, "text": "Maksym Lysak", "orig": "Maksym Lysak", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 3, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 217.0, "r_y0": 176.3, "r_x1": 235.2, "r_y1": 176.3, "r_x2": 235.2, "r_y2": 170.1, "r_x3": 217.0, "r_y3": 170.1, "coord_origin": "TOPLEFT" }, "text": "[0000", "orig": "[0000", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 4, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 235.2, "r_y0": 176.3, "r_x1": 241.4, "r_y1": 176.3, "r_x2": 241.4, "r_y2": 169.7, "r_x3": 235.2, "r_y3": 169.7, "coord_origin": "TOPLEFT" }, "text": "\u2212", "orig": "\u2212", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 5, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 241.4, "r_y0": 176.3, "r_x1": 257.3, "r_y1": 176.3, "r_x2": 257.3, "r_y2": 170.1, "r_x3": 241.4, "r_y3": 170.1, "coord_origin": "TOPLEFT" }, "text": "0002", "orig": "0002", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 6, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 257.3, "r_y0": 176.3, "r_x1": 263.5, "r_y1": 176.3, "r_x2": 263.5, "r_y2": 169.7, "r_x3": 257.3, "r_y3": 169.7, "coord_origin": "TOPLEFT" }, "text": "\u2212", "orig": "\u2212", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 7, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 263.5, "r_y0": 176.3, "r_x1": 279.4, "r_y1": 176.3, "r_x2": 279.4, "r_y2": 170.1, "r_x3": 263.5, "r_y3": 170.1, "coord_origin": "TOPLEFT" }, "text": "3723", "orig": "3723", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 8, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 279.4, "r_y0": 176.3, "r_x1": 285.6, "r_y1": 176.3, "r_x2": 285.6, "r_y2": 169.7, "r_x3": 279.4, "r_y3": 169.7, "coord_origin": "TOPLEFT" }, "text": "\u2212", "orig": "\u2212", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 9, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 285.6, "r_y0": 180.5, "r_x1": 392.3, "r_y1": 180.5, "r_x2": 392.3, "r_y2": 171.7, "r_x3": 285.6, "r_y3": 171.7, "coord_origin": "TOPLEFT" }, "text": "$^{6960]}$, Ahmed Nassar[0000", "orig": "$^{6960]}$, Ahmed Nassar[0000", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 10, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 392.3, "r_y0": 176.3, "r_x1": 398.5, "r_y1": 176.3, "r_x2": 398.5, "r_y2": 169.7, "r_x3": 392.3, "r_y3": 169.7, "coord_origin": "TOPLEFT" }, "text": "\u2212", "orig": "\u2212", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 11, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 398.5, "r_y0": 176.3, "r_x1": 414.4, "r_y1": 176.3, "r_x2": 414.4, "r_y2": 170.1, "r_x3": 398.5, "r_y3": 170.1, "coord_origin": "TOPLEFT" }, "text": "0002", "orig": "0002", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 12, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 414.4, "r_y0": 176.3, "r_x1": 420.6, "r_y1": 176.3, "r_x2": 420.6, "r_y2": 169.7, "r_x3": 414.4, "r_y3": 169.7, "coord_origin": "TOPLEFT" }, "text": "\u2212", "orig": "\u2212", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 13, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 420.6, "r_y0": 176.3, "r_x1": 436.5, "r_y1": 176.3, "r_x2": 436.5, "r_y2": 170.1, "r_x3": 420.6, "r_y3": 170.1, "coord_origin": "TOPLEFT" }, "text": "9468", "orig": "9468", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 14, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 436.5, "r_y0": 176.3, "r_x1": 442.7, "r_y1": 176.3, "r_x2": 442.7, "r_y2": 169.7, "r_x3": 436.5, "r_y3": 169.7, "coord_origin": "TOPLEFT" }, "text": "\u2212", "orig": "\u2212", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 15, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 442.7, "r_y0": 180.5, "r_x1": 464.1, "r_y1": 180.5, "r_x2": 464.1, "r_y2": 171.7, "r_x3": 442.7, "r_y3": 171.7, "coord_origin": "TOPLEFT" }, "text": "$^{0822]}$,", "orig": "$^{0822]}$,", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 16, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 139.3, "r_y0": 192.4, "r_x1": 224.8, "r_y1": 192.4, "r_x2": 224.8, "r_y2": 183.6, "r_x3": 139.3, "r_y3": 183.6, "coord_origin": "TOPLEFT" }, "text": "Nikolaos Livathinos", "orig": "Nikolaos Livathinos", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 17, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 224.8, "r_y0": 188.2, "r_x1": 242.9, "r_y1": 188.2, "r_x2": 242.9, "r_y2": 182.0, "r_x3": 224.8, "r_y3": 182.0, "coord_origin": "TOPLEFT" }, "text": "[0000", "orig": "[0000", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 18, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 242.9, "r_y0": 188.2, "r_x1": 249.2, "r_y1": 188.2, "r_x2": 249.2, "r_y2": 181.6, "r_x3": 242.9, "r_y3": 181.6, "coord_origin": "TOPLEFT" }, "text": "\u2212", "orig": "\u2212", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 19, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 249.2, "r_y0": 188.2, "r_x1": 265.1, "r_y1": 188.2, "r_x2": 265.1, "r_y2": 182.0, "r_x3": 249.2, "r_y3": 182.0, "coord_origin": "TOPLEFT" }, "text": "0001", "orig": "0001", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 20, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 265.1, "r_y0": 188.2, "r_x1": 271.3, "r_y1": 188.2, "r_x2": 271.3, "r_y2": 181.6, "r_x3": 265.1, "r_y3": 181.6, "coord_origin": "TOPLEFT" }, "text": "\u2212", "orig": "\u2212", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 21, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 271.3, "r_y0": 188.2, "r_x1": 287.2, "r_y1": 188.2, "r_x2": 287.2, "r_y2": 182.0, "r_x3": 271.3, "r_y3": 182.0, "coord_origin": "TOPLEFT" }, "text": "8513", "orig": "8513", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 22, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 287.2, "r_y0": 188.2, "r_x1": 293.4, "r_y1": 188.2, "r_x2": 293.4, "r_y2": 181.6, "r_x3": 287.2, "r_y3": 181.6, "coord_origin": "TOPLEFT" }, "text": "\u2212", "orig": "\u2212", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 23, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 293.4, "r_y0": 192.4, "r_x1": 404.2, "r_y1": 192.4, "r_x2": 404.2, "r_y2": 183.6, "r_x3": 293.4, "r_y3": 183.6, "coord_origin": "TOPLEFT" }, "text": "$^{3491]}$, Christoph Auer[0000", "orig": "$^{3491]}$, Christoph Auer[0000", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 24, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 404.2, "r_y0": 188.2, "r_x1": 410.4, "r_y1": 188.2, "r_x2": 410.4, "r_y2": 181.6, "r_x3": 404.2, "r_y3": 181.6, "coord_origin": "TOPLEFT" }, "text": "\u2212", "orig": "\u2212", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 25, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 410.4, "r_y0": 188.2, "r_x1": 426.3, "r_y1": 188.2, "r_x2": 426.3, "r_y2": 182.0, "r_x3": 410.4, "r_y3": 182.0, "coord_origin": "TOPLEFT" }, "text": "0001", "orig": "0001", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 26, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 426.3, "r_y0": 188.2, "r_x1": 432.5, "r_y1": 188.2, "r_x2": 432.5, "r_y2": 181.6, "r_x3": 426.3, "r_y3": 181.6, "coord_origin": "TOPLEFT" }, "text": "\u2212", "orig": "\u2212", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 27, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 432.5, "r_y0": 188.2, "r_x1": 448.4, "r_y1": 188.2, "r_x2": 448.4, "r_y2": 182.0, "r_x3": 432.5, "r_y3": 182.0, "coord_origin": "TOPLEFT" }, "text": "5761", "orig": "5761", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 28, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 448.4, "r_y0": 188.2, "r_x1": 454.6, "r_y1": 188.2, "r_x2": 454.6, "r_y2": 181.6, "r_x3": 448.4, "r_y3": 181.6, "coord_origin": "TOPLEFT" }, "text": "\u2212", "orig": "\u2212", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 29, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 454.6, "r_y0": 192.4, "r_x1": 476.0, "r_y1": 192.4, "r_x2": 476.0, "r_y2": 183.6, "r_x3": 454.6, "r_y3": 183.6, "coord_origin": "TOPLEFT" }, "text": "$^{0422]}$,", "orig": "$^{0422]}$,", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 30, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 229.5, "r_y0": 204.4, "r_x1": 298.6, "r_y1": 204.4, "r_x2": 298.6, "r_y2": 195.6, "r_x3": 229.5, "r_y3": 195.6, "coord_origin": "TOPLEFT" }, "text": "and Peter Staar", "orig": "and Peter Staar", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 31, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 298.6, "r_y0": 200.2, "r_x1": 316.7, "r_y1": 200.2, "r_x2": 316.7, "r_y2": 194.0, "r_x3": 298.6, "r_y3": 194.0, "coord_origin": "TOPLEFT" }, "text": "[0000", "orig": "[0000", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 32, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 316.7, "r_y0": 200.2, "r_x1": 323.0, "r_y1": 200.2, "r_x2": 323.0, "r_y2": 193.6, "r_x3": 316.7, "r_y3": 193.6, "coord_origin": "TOPLEFT" }, "text": "\u2212", "orig": "\u2212", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 33, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 323.0, "r_y0": 200.2, "r_x1": 338.9, "r_y1": 200.2, "r_x2": 338.9, "r_y2": 194.0, "r_x3": 323.0, "r_y3": 194.0, "coord_origin": "TOPLEFT" }, "text": "0002", "orig": "0002", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 34, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 338.9, "r_y0": 200.2, "r_x1": 345.1, "r_y1": 200.2, "r_x2": 345.1, "r_y2": 193.6, "r_x3": 338.9, "r_y3": 193.6, "coord_origin": "TOPLEFT" }, "text": "\u2212", "orig": "\u2212", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 35, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 345.1, "r_y0": 200.2, "r_x1": 361.0, "r_y1": 200.2, "r_x2": 361.0, "r_y2": 194.0, "r_x3": 345.1, "r_y3": 194.0, "coord_origin": "TOPLEFT" }, "text": "8088", "orig": "8088", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 36, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 361.0, "r_y0": 200.2, "r_x1": 367.2, "r_y1": 200.2, "r_x2": 367.2, "r_y2": 193.6, "r_x3": 361.0, "r_y3": 193.6, "coord_origin": "TOPLEFT" }, "text": "\u2212", "orig": "\u2212", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 37, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 367.2, "r_y0": 200.2, "r_x1": 385.3, "r_y1": 200.2, "r_x2": 385.3, "r_y2": 194.0, "r_x3": 367.2, "r_y3": 194.0, "coord_origin": "TOPLEFT" }, "text": "0823]", "orig": "0823]", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 38, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 279.1, "r_y0": 225.3, "r_x1": 336.3, "r_y1": 225.3, "r_x2": 336.3, "r_y2": 217.2, "r_x3": 279.1, "r_y3": 217.2, "coord_origin": "TOPLEFT" }, "text": "IBM Research", "orig": "IBM Research", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 39, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 223.0, "r_y0": 236.3, "r_x1": 392.4, "r_y1": 236.3, "r_x2": 392.4, "r_y2": 228.8, "r_x3": 223.0, "r_y3": 228.8, "coord_origin": "TOPLEFT" }, "text": "{mly,ahn,nli,cau,taa}@zurich.ibm.com", "orig": "{mly,ahn,nli,cau,taa}@zurich.ibm.com", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 40, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 163.1, "r_y0": 278.2, "r_x1": 206.6, "r_y1": 278.2, "r_x2": 206.6, "r_y2": 270.3, "r_x3": 163.1, "r_y3": 270.3, "coord_origin": "TOPLEFT" }, "text": "Abstract.", "orig": "Abstract.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 41, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 211.6, "r_y0": 278.4, "r_x1": 452.2, "r_y1": 278.4, "r_x2": 452.2, "r_y2": 270.4, "r_x3": 211.6, "r_y3": 270.4, "coord_origin": "TOPLEFT" }, "text": "Extracting tables from documents is a crucial task in any", "orig": "Extracting tables from documents is a crucial task in any", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 42, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 163.1, "r_y0": 289.4, "r_x1": 452.2, "r_y1": 289.4, "r_x2": 452.2, "r_y2": 281.3, "r_x3": 163.1, "r_y3": 281.3, "coord_origin": "TOPLEFT" }, "text": "document conversion pipeline. Recently, transformer-based models have", "orig": "document conversion pipeline. Recently, transformer-based models have", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 43, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 163.1, "r_y0": 300.4, "r_x1": 452.2, "r_y1": 300.4, "r_x2": 452.2, "r_y2": 292.3, "r_x3": 163.1, "r_y3": 292.3, "coord_origin": "TOPLEFT" }, "text": "demonstrated that table-structure can be recognized with impressive ac-", "orig": "demonstrated that table-structure can be recognized with impressive ac-", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 44, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 163.1, "r_y0": 311.3, "r_x1": 452.2, "r_y1": 311.3, "r_x2": 452.2, "r_y2": 303.2, "r_x3": 163.1, "r_y3": 303.2, "coord_origin": "TOPLEFT" }, "text": "curacy using Image-to-Markup-Sequence (Im2Seq) approaches. Taking", "orig": "curacy using Image-to-Markup-Sequence (Im2Seq) approaches. Taking", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 45, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 163.1, "r_y0": 322.3, "r_x1": 452.2, "r_y1": 322.3, "r_x2": 452.2, "r_y2": 314.2, "r_x3": 163.1, "r_y3": 314.2, "coord_origin": "TOPLEFT" }, "text": "only the image of a table, such models predict a sequence of tokens (e.g.", "orig": "only the image of a table, such models predict a sequence of tokens (e.g.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 46, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 163.1, "r_y0": 333.2, "r_x1": 452.2, "r_y1": 333.2, "r_x2": 452.2, "r_y2": 325.2, "r_x3": 163.1, "r_y3": 325.2, "coord_origin": "TOPLEFT" }, "text": "in HTML, LaTeX) which represent the structure of the table. Since the", "orig": "in HTML, LaTeX) which represent the structure of the table. Since the", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 47, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 163.1, "r_y0": 344.2, "r_x1": 452.2, "r_y1": 344.2, "r_x2": 452.2, "r_y2": 336.1, "r_x3": 163.1, "r_y3": 336.1, "coord_origin": "TOPLEFT" }, "text": "token representation of the table structure has a significant impact on", "orig": "token representation of the table structure has a significant impact on", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 48, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 163.1, "r_y0": 355.1, "r_x1": 452.2, "r_y1": 355.1, "r_x2": 452.2, "r_y2": 347.1, "r_x3": 163.1, "r_y3": 347.1, "coord_origin": "TOPLEFT" }, "text": "the accuracy and run-time performance of any Im2Seq model, we inves-", "orig": "the accuracy and run-time performance of any Im2Seq model, we inves-", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 49, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 163.1, "r_y0": 366.1, "r_x1": 452.2, "r_y1": 366.1, "r_x2": 452.2, "r_y2": 358.0, "r_x3": 163.1, "r_y3": 358.0, "coord_origin": "TOPLEFT" }, "text": "tigate in this paper how table-structure representation can be optimised.", "orig": "tigate in this paper how table-structure representation can be optimised.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 50, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 163.1, "r_y0": 377.1, "r_x1": 452.2, "r_y1": 377.1, "r_x2": 452.2, "r_y2": 369.0, "r_x3": 163.1, "r_y3": 369.0, "coord_origin": "TOPLEFT" }, "text": "We propose a new, optimised table-structure language (OTSL) with a", "orig": "We propose a new, optimised table-structure language (OTSL) with a", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 51, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 163.1, "r_y0": 388.0, "r_x1": 452.2, "r_y1": 388.0, "r_x2": 452.2, "r_y2": 380.0, "r_x3": 163.1, "r_y3": 380.0, "coord_origin": "TOPLEFT" }, "text": "minimized vocabulary and specific rules. The benefits of OTSL are that", "orig": "minimized vocabulary and specific rules. The benefits of OTSL are that", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 52, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 163.1, "r_y0": 399.0, "r_x1": 452.2, "r_y1": 399.0, "r_x2": 452.2, "r_y2": 390.9, "r_x3": 163.1, "r_y3": 390.9, "coord_origin": "TOPLEFT" }, "text": "it reduces the number of tokens to 5 (HTML needs 28+) and shortens", "orig": "it reduces the number of tokens to 5 (HTML needs 28+) and shortens", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 53, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 163.1, "r_y0": 409.9, "r_x1": 452.2, "r_y1": 409.9, "r_x2": 452.2, "r_y2": 401.9, "r_x3": 163.1, "r_y3": 401.9, "coord_origin": "TOPLEFT" }, "text": "the sequence length to half of HTML on average. Consequently, model", "orig": "the sequence length to half of HTML on average. Consequently, model", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 54, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 163.1, "r_y0": 420.9, "r_x1": 452.2, "r_y1": 420.9, "r_x2": 452.2, "r_y2": 412.8, "r_x3": 163.1, "r_y3": 412.8, "coord_origin": "TOPLEFT" }, "text": "accuracy improves significantly, inference time is halved compared to", "orig": "accuracy improves significantly, inference time is halved compared to", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 55, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 163.1, "r_y0": 431.9, "r_x1": 452.2, "r_y1": 431.9, "r_x2": 452.2, "r_y2": 423.8, "r_x3": 163.1, "r_y3": 423.8, "coord_origin": "TOPLEFT" }, "text": "HTML-based models, and the predicted table structures are always syn-", "orig": "HTML-based models, and the predicted table structures are always syn-", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 56, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 163.1, "r_y0": 442.8, "r_x1": 452.2, "r_y1": 442.8, "r_x2": 452.2, "r_y2": 434.7, "r_x3": 163.1, "r_y3": 434.7, "coord_origin": "TOPLEFT" }, "text": "tactically correct. This in turn eliminates most post-processing needs.", "orig": "tactically correct. This in turn eliminates most post-processing needs.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 57, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 163.1, "r_y0": 453.8, "r_x1": 452.2, "r_y1": 453.8, "r_x2": 452.2, "r_y2": 445.7, "r_x3": 163.1, "r_y3": 445.7, "coord_origin": "TOPLEFT" }, "text": "Popular table structure data-sets will be published in OTSL format to", "orig": "Popular table structure data-sets will be published in OTSL format to", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 58, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 163.1, "r_y0": 464.7, "r_x1": 225.6, "r_y1": 464.7, "r_x2": 225.6, "r_y2": 456.7, "r_x3": 163.1, "r_y3": 456.7, "coord_origin": "TOPLEFT" }, "text": "the community.", "orig": "the community.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 59, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 163.1, "r_y0": 486.6, "r_x1": 211.9, "r_y1": 486.6, "r_x2": 211.9, "r_y2": 478.7, "r_x3": 163.1, "r_y3": 478.7, "coord_origin": "TOPLEFT" }, "text": "Keywords:", "orig": "Keywords:", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 60, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 216.6, "r_y0": 486.8, "r_x1": 452.2, "r_y1": 486.8, "r_x2": 452.2, "r_y2": 478.8, "r_x3": 216.6, "r_y3": 478.8, "coord_origin": "TOPLEFT" }, "text": "Table Structure Recognition \u00b7 Data Representation \u00b7 Trans-", "orig": "Table Structure Recognition \u00b7 Data Representation \u00b7 Trans-", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 61, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 163.1, "r_y0": 497.8, "r_x1": 257.6, "r_y1": 497.8, "r_x2": 257.6, "r_y2": 489.7, "r_x3": 163.1, "r_y3": 489.7, "coord_origin": "TOPLEFT" }, "text": "formers \u00b7 Optimization.", "orig": "formers \u00b7 Optimization.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 62, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 134.8, "r_y0": 532.7, "r_x1": 141.5, "r_y1": 532.7, "r_x2": 141.5, "r_y2": 522.1, "r_x3": 134.8, "r_y3": 522.1, "coord_origin": "TOPLEFT" }, "text": "1", "orig": "1", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 63, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 154.9, "r_y0": 532.7, "r_x1": 228.9, "r_y1": 532.7, "r_x2": 228.9, "r_y2": 522.1, "r_x3": 154.9, "r_y3": 522.1, "coord_origin": "TOPLEFT" }, "text": "Introduction", "orig": "Introduction", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 64, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 134.8, "r_y0": 557.1, "r_x1": 480.6, "r_y1": 557.1, "r_x2": 480.6, "r_y2": 548.3, "r_x3": 134.8, "r_y3": 548.3, "coord_origin": "TOPLEFT" }, "text": "Tables are ubiquitous in documents such as scientific papers, patents, reports,", "orig": "Tables are ubiquitous in documents such as scientific papers, patents, reports,", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 65, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 134.8, "r_y0": 569.0, "r_x1": 480.6, "r_y1": 569.0, "r_x2": 480.6, "r_y2": 560.2, "r_x3": 134.8, "r_y3": 560.2, "coord_origin": "TOPLEFT" }, "text": "manuals, specification sheets or marketing material. They often encode highly", "orig": "manuals, specification sheets or marketing material. They often encode highly", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 66, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 134.8, "r_y0": 581.0, "r_x1": 480.6, "r_y1": 581.0, "r_x2": 480.6, "r_y2": 572.2, "r_x3": 134.8, "r_y3": 572.2, "coord_origin": "TOPLEFT" }, "text": "valuable information and therefore need to be extracted with high accuracy.", "orig": "valuable information and therefore need to be extracted with high accuracy.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 67, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 134.8, "r_y0": 592.9, "r_x1": 480.6, "r_y1": 592.9, "r_x2": 480.6, "r_y2": 584.2, "r_x3": 134.8, "r_y3": 584.2, "coord_origin": "TOPLEFT" }, "text": "Unfortunately, tables appear in documents in various sizes, styling and struc-", "orig": "Unfortunately, tables appear in documents in various sizes, styling and struc-", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 68, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 134.8, "r_y0": 604.9, "r_x1": 480.6, "r_y1": 604.9, "r_x2": 480.6, "r_y2": 596.1, "r_x3": 134.8, "r_y3": 596.1, "coord_origin": "TOPLEFT" }, "text": "ture, making it difficult to recover their correct structure with simple analyt-", "orig": "ture, making it difficult to recover their correct structure with simple analyt-", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 69, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 134.8, "r_y0": 616.9, "r_x1": 480.6, "r_y1": 616.9, "r_x2": 480.6, "r_y2": 608.1, "r_x3": 134.8, "r_y3": 608.1, "coord_origin": "TOPLEFT" }, "text": "ical methods. Therefore, accurate table extraction is achieved these days with", "orig": "ical methods. Therefore, accurate table extraction is achieved these days with", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 70, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 134.8, "r_y0": 628.8, "r_x1": 279.3, "r_y1": 628.8, "r_x2": 279.3, "r_y2": 620.0, "r_x3": 134.8, "r_y3": 620.0, "coord_origin": "TOPLEFT" }, "text": "machine-learning based methods.", "orig": "machine-learning based methods.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 71, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 149.7, "r_y0": 640.9, "r_x1": 480.6, "r_y1": 640.9, "r_x2": 480.6, "r_y2": 632.1, "r_x3": 149.7, "r_y3": 632.1, "coord_origin": "TOPLEFT" }, "text": "In modern document understanding systems [1,15], table extraction is typi-", "orig": "In modern document understanding systems [1,15], table extraction is typi-", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 72, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 134.8, "r_y0": 652.9, "r_x1": 480.6, "r_y1": 652.9, "r_x2": 480.6, "r_y2": 644.1, "r_x3": 134.8, "r_y3": 644.1, "coord_origin": "TOPLEFT" }, "text": "cally a two-step process. Firstly, every table on a page is located with a bounding", "orig": "cally a two-step process. Firstly, every table on a page is located with a bounding", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 73, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 134.8, "r_y0": 664.9, "r_x1": 480.6, "r_y1": 664.9, "r_x2": 480.6, "r_y2": 656.1, "r_x3": 134.8, "r_y3": 656.1, "coord_origin": "TOPLEFT" }, "text": "box, and secondly, their logical row and column structure is recognized. As of", "orig": "box, and secondly, their logical row and column structure is recognized. As of", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 74, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 18.3, "r_y0": 555.0, "r_x1": 36.3, "r_y1": 555.0, "r_x2": 36.3, "r_y2": 209.5, "r_x3": 18.3, "r_y3": 209.5, "coord_origin": "TOPLEFT" }, "text": "arXiv:2305.03393v1 [cs.CV] 5 May 2023", "orig": "arXiv:2305.03393v1 [cs.CV] 5 May 2023", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "has_chars": false, "has_words": false, "has_lines": true, "image": null, "lines": [] }, "predictions": { "layout": { "clusters": [ { "id": 5, "label": "section_header", "bbox": { "l": 134.8, "t": 115.9, "r": 480.6, "b": 146.5, "coord_origin": "TOPLEFT" }, "confidence": 0.89, "cells": [ { "index": 0, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 134.8, "r_y0": 128.6, "r_x1": 480.6, "r_y1": 128.6, "r_x2": 480.6, "r_y2": 115.9, "r_x3": 134.8, "r_y3": 115.9, "coord_origin": "TOPLEFT" }, "text": "Optimized Table Tokenization for Table Structure", "orig": "Optimized Table Tokenization for Table Structure", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 1, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 266.7, "r_y0": 146.5, "r_x1": 348.7, "r_y1": 146.5, "r_x2": 348.7, "r_y2": 133.8, "r_x3": 266.7, "r_y3": 133.8, "coord_origin": "TOPLEFT" }, "text": "Recognition", "orig": "Recognition", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 16, "label": "key_value_region", "bbox": { "l": 139.3, "t": 169.7, "r": 476.0, "b": 236.3, "coord_origin": "TOPLEFT" }, "confidence": 0.48, "cells": [ { "index": 2, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 151.2, "r_y0": 180.5, "r_x1": 217.0, "r_y1": 180.5, "r_x2": 217.0, "r_y2": 171.7, "r_x3": 151.2, "r_y3": 171.7, "coord_origin": "TOPLEFT" }, "text": "Maksym Lysak", "orig": "Maksym Lysak", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 3, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 217.0, "r_y0": 176.3, "r_x1": 235.2, "r_y1": 176.3, "r_x2": 235.2, "r_y2": 170.1, "r_x3": 217.0, "r_y3": 170.1, "coord_origin": "TOPLEFT" }, "text": "[0000", "orig": "[0000", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 4, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 235.2, "r_y0": 176.3, "r_x1": 241.4, "r_y1": 176.3, "r_x2": 241.4, "r_y2": 169.7, "r_x3": 235.2, "r_y3": 169.7, "coord_origin": "TOPLEFT" }, "text": "\u2212", "orig": "\u2212", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 5, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 241.4, "r_y0": 176.3, "r_x1": 257.3, "r_y1": 176.3, "r_x2": 257.3, "r_y2": 170.1, "r_x3": 241.4, "r_y3": 170.1, "coord_origin": "TOPLEFT" }, "text": "0002", "orig": "0002", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 6, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 257.3, "r_y0": 176.3, "r_x1": 263.5, "r_y1": 176.3, "r_x2": 263.5, "r_y2": 169.7, "r_x3": 257.3, "r_y3": 169.7, "coord_origin": "TOPLEFT" }, "text": "\u2212", "orig": "\u2212", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 7, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 263.5, "r_y0": 176.3, "r_x1": 279.4, "r_y1": 176.3, "r_x2": 279.4, "r_y2": 170.1, "r_x3": 263.5, "r_y3": 170.1, "coord_origin": "TOPLEFT" }, "text": "3723", "orig": "3723", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 8, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 279.4, "r_y0": 176.3, "r_x1": 285.6, "r_y1": 176.3, "r_x2": 285.6, "r_y2": 169.7, "r_x3": 279.4, "r_y3": 169.7, "coord_origin": "TOPLEFT" }, "text": "\u2212", "orig": "\u2212", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 9, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 285.6, "r_y0": 180.5, "r_x1": 392.3, "r_y1": 180.5, "r_x2": 392.3, "r_y2": 171.7, "r_x3": 285.6, "r_y3": 171.7, "coord_origin": "TOPLEFT" }, "text": "$^{6960]}$, Ahmed Nassar[0000", "orig": "$^{6960]}$, Ahmed Nassar[0000", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 10, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 392.3, "r_y0": 176.3, "r_x1": 398.5, "r_y1": 176.3, "r_x2": 398.5, "r_y2": 169.7, "r_x3": 392.3, "r_y3": 169.7, "coord_origin": "TOPLEFT" }, "text": "\u2212", "orig": "\u2212", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 11, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 398.5, "r_y0": 176.3, "r_x1": 414.4, "r_y1": 176.3, "r_x2": 414.4, "r_y2": 170.1, "r_x3": 398.5, "r_y3": 170.1, "coord_origin": "TOPLEFT" }, "text": "0002", "orig": "0002", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 12, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 414.4, "r_y0": 176.3, "r_x1": 420.6, "r_y1": 176.3, "r_x2": 420.6, "r_y2": 169.7, "r_x3": 414.4, "r_y3": 169.7, "coord_origin": "TOPLEFT" }, "text": "\u2212", "orig": "\u2212", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 13, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 420.6, "r_y0": 176.3, "r_x1": 436.5, "r_y1": 176.3, "r_x2": 436.5, "r_y2": 170.1, "r_x3": 420.6, "r_y3": 170.1, "coord_origin": "TOPLEFT" }, "text": "9468", "orig": "9468", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 14, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 436.5, "r_y0": 176.3, "r_x1": 442.7, "r_y1": 176.3, "r_x2": 442.7, "r_y2": 169.7, "r_x3": 436.5, "r_y3": 169.7, "coord_origin": "TOPLEFT" }, "text": "\u2212", "orig": "\u2212", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 15, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 442.7, "r_y0": 180.5, "r_x1": 464.1, "r_y1": 180.5, "r_x2": 464.1, "r_y2": 171.7, "r_x3": 442.7, "r_y3": 171.7, "coord_origin": "TOPLEFT" }, "text": "$^{0822]}$,", "orig": "$^{0822]}$,", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 16, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 139.3, "r_y0": 192.4, "r_x1": 224.8, "r_y1": 192.4, "r_x2": 224.8, "r_y2": 183.6, "r_x3": 139.3, "r_y3": 183.6, "coord_origin": "TOPLEFT" }, "text": "Nikolaos Livathinos", "orig": "Nikolaos Livathinos", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 17, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 224.8, "r_y0": 188.2, "r_x1": 242.9, "r_y1": 188.2, "r_x2": 242.9, "r_y2": 182.0, "r_x3": 224.8, "r_y3": 182.0, "coord_origin": "TOPLEFT" }, "text": "[0000", "orig": "[0000", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 18, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 242.9, "r_y0": 188.2, "r_x1": 249.2, "r_y1": 188.2, "r_x2": 249.2, "r_y2": 181.6, "r_x3": 242.9, "r_y3": 181.6, "coord_origin": "TOPLEFT" }, "text": "\u2212", "orig": "\u2212", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 19, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 249.2, "r_y0": 188.2, "r_x1": 265.1, "r_y1": 188.2, "r_x2": 265.1, "r_y2": 182.0, "r_x3": 249.2, "r_y3": 182.0, "coord_origin": "TOPLEFT" }, "text": "0001", "orig": "0001", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 20, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 265.1, "r_y0": 188.2, "r_x1": 271.3, "r_y1": 188.2, "r_x2": 271.3, "r_y2": 181.6, "r_x3": 265.1, "r_y3": 181.6, "coord_origin": "TOPLEFT" }, "text": "\u2212", "orig": "\u2212", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 21, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 271.3, "r_y0": 188.2, "r_x1": 287.2, "r_y1": 188.2, "r_x2": 287.2, "r_y2": 182.0, "r_x3": 271.3, "r_y3": 182.0, "coord_origin": "TOPLEFT" }, "text": "8513", "orig": "8513", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 22, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 287.2, "r_y0": 188.2, "r_x1": 293.4, "r_y1": 188.2, "r_x2": 293.4, "r_y2": 181.6, "r_x3": 287.2, "r_y3": 181.6, "coord_origin": "TOPLEFT" }, "text": "\u2212", "orig": "\u2212", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 23, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 293.4, "r_y0": 192.4, "r_x1": 404.2, "r_y1": 192.4, "r_x2": 404.2, "r_y2": 183.6, "r_x3": 293.4, "r_y3": 183.6, "coord_origin": "TOPLEFT" }, "text": "$^{3491]}$, Christoph Auer[0000", "orig": "$^{3491]}$, Christoph Auer[0000", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 24, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 404.2, "r_y0": 188.2, "r_x1": 410.4, "r_y1": 188.2, "r_x2": 410.4, "r_y2": 181.6, "r_x3": 404.2, "r_y3": 181.6, "coord_origin": "TOPLEFT" }, "text": "\u2212", "orig": "\u2212", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 25, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 410.4, "r_y0": 188.2, "r_x1": 426.3, "r_y1": 188.2, "r_x2": 426.3, "r_y2": 182.0, "r_x3": 410.4, "r_y3": 182.0, "coord_origin": "TOPLEFT" }, "text": "0001", "orig": "0001", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 26, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 426.3, "r_y0": 188.2, "r_x1": 432.5, "r_y1": 188.2, "r_x2": 432.5, "r_y2": 181.6, "r_x3": 426.3, "r_y3": 181.6, "coord_origin": "TOPLEFT" }, "text": "\u2212", "orig": "\u2212", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 27, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 432.5, "r_y0": 188.2, "r_x1": 448.4, "r_y1": 188.2, "r_x2": 448.4, "r_y2": 182.0, "r_x3": 432.5, "r_y3": 182.0, "coord_origin": "TOPLEFT" }, "text": "5761", "orig": "5761", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 28, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 448.4, "r_y0": 188.2, "r_x1": 454.6, "r_y1": 188.2, "r_x2": 454.6, "r_y2": 181.6, "r_x3": 448.4, "r_y3": 181.6, "coord_origin": "TOPLEFT" }, "text": "\u2212", "orig": "\u2212", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 29, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 454.6, "r_y0": 192.4, "r_x1": 476.0, "r_y1": 192.4, "r_x2": 476.0, "r_y2": 183.6, "r_x3": 454.6, "r_y3": 183.6, "coord_origin": "TOPLEFT" }, "text": "$^{0422]}$,", "orig": "$^{0422]}$,", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 30, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 229.5, "r_y0": 204.4, "r_x1": 298.6, "r_y1": 204.4, "r_x2": 298.6, "r_y2": 195.6, "r_x3": 229.5, "r_y3": 195.6, "coord_origin": "TOPLEFT" }, "text": "and Peter Staar", "orig": "and Peter Staar", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 31, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 298.6, "r_y0": 200.2, "r_x1": 316.7, "r_y1": 200.2, "r_x2": 316.7, "r_y2": 194.0, "r_x3": 298.6, "r_y3": 194.0, "coord_origin": "TOPLEFT" }, "text": "[0000", "orig": "[0000", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 32, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 316.7, "r_y0": 200.2, "r_x1": 323.0, "r_y1": 200.2, "r_x2": 323.0, "r_y2": 193.6, "r_x3": 316.7, "r_y3": 193.6, "coord_origin": "TOPLEFT" }, "text": "\u2212", "orig": "\u2212", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 33, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 323.0, "r_y0": 200.2, "r_x1": 338.9, "r_y1": 200.2, "r_x2": 338.9, "r_y2": 194.0, "r_x3": 323.0, "r_y3": 194.0, "coord_origin": "TOPLEFT" }, "text": "0002", "orig": "0002", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 34, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 338.9, "r_y0": 200.2, "r_x1": 345.1, "r_y1": 200.2, "r_x2": 345.1, "r_y2": 193.6, "r_x3": 338.9, "r_y3": 193.6, "coord_origin": "TOPLEFT" }, "text": "\u2212", "orig": "\u2212", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 35, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 345.1, "r_y0": 200.2, "r_x1": 361.0, "r_y1": 200.2, "r_x2": 361.0, "r_y2": 194.0, "r_x3": 345.1, "r_y3": 194.0, "coord_origin": "TOPLEFT" }, "text": "8088", "orig": "8088", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 36, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 361.0, "r_y0": 200.2, "r_x1": 367.2, "r_y1": 200.2, "r_x2": 367.2, "r_y2": 193.6, "r_x3": 361.0, "r_y3": 193.6, "coord_origin": "TOPLEFT" }, "text": "\u2212", "orig": "\u2212", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 37, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 367.2, "r_y0": 200.2, "r_x1": 385.3, "r_y1": 200.2, "r_x2": 385.3, "r_y2": 194.0, "r_x3": 367.2, "r_y3": 194.0, "coord_origin": "TOPLEFT" }, "text": "0823]", "orig": "0823]", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 38, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 279.1, "r_y0": 225.3, "r_x1": 336.3, "r_y1": 225.3, "r_x2": 336.3, "r_y2": 217.2, "r_x3": 279.1, "r_y3": 217.2, "coord_origin": "TOPLEFT" }, "text": "IBM Research", "orig": "IBM Research", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 39, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 223.0, "r_y0": 236.3, "r_x1": 392.4, "r_y1": 236.3, "r_x2": 392.4, "r_y2": 228.8, "r_x3": 223.0, "r_y3": 228.8, "coord_origin": "TOPLEFT" }, "text": "{mly,ahn,nli,cau,taa}@zurich.ibm.com", "orig": "{mly,ahn,nli,cau,taa}@zurich.ibm.com", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [ { "id": 7, "label": "text", "bbox": { "l": 139.3, "t": 169.7, "r": 476.0, "b": 200.2, "coord_origin": "TOPLEFT" }, "confidence": 0.79, "cells": [ { "index": 2, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 151.2, "r_y0": 180.5, "r_x1": 217.0, "r_y1": 180.5, "r_x2": 217.0, "r_y2": 171.7, "r_x3": 151.2, "r_y3": 171.7, "coord_origin": "TOPLEFT" }, "text": "Maksym Lysak", "orig": "Maksym Lysak", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 3, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 217.0, "r_y0": 176.3, "r_x1": 235.2, "r_y1": 176.3, "r_x2": 235.2, "r_y2": 170.1, "r_x3": 217.0, "r_y3": 170.1, "coord_origin": "TOPLEFT" }, "text": "[0000", "orig": "[0000", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 4, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 235.2, "r_y0": 176.3, "r_x1": 241.4, "r_y1": 176.3, "r_x2": 241.4, "r_y2": 169.7, "r_x3": 235.2, "r_y3": 169.7, "coord_origin": "TOPLEFT" }, "text": "\u2212", "orig": "\u2212", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 5, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 241.4, "r_y0": 176.3, "r_x1": 257.3, "r_y1": 176.3, "r_x2": 257.3, "r_y2": 170.1, "r_x3": 241.4, "r_y3": 170.1, "coord_origin": "TOPLEFT" }, "text": "0002", "orig": "0002", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 6, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 257.3, "r_y0": 176.3, "r_x1": 263.5, "r_y1": 176.3, "r_x2": 263.5, "r_y2": 169.7, "r_x3": 257.3, "r_y3": 169.7, "coord_origin": "TOPLEFT" }, "text": "\u2212", "orig": "\u2212", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 7, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 263.5, "r_y0": 176.3, "r_x1": 279.4, "r_y1": 176.3, "r_x2": 279.4, "r_y2": 170.1, "r_x3": 263.5, "r_y3": 170.1, "coord_origin": "TOPLEFT" }, "text": "3723", "orig": "3723", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 8, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 279.4, "r_y0": 176.3, "r_x1": 285.6, "r_y1": 176.3, "r_x2": 285.6, "r_y2": 169.7, "r_x3": 279.4, "r_y3": 169.7, "coord_origin": "TOPLEFT" }, "text": "\u2212", "orig": "\u2212", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 9, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 285.6, "r_y0": 180.5, "r_x1": 392.3, "r_y1": 180.5, "r_x2": 392.3, "r_y2": 171.7, "r_x3": 285.6, "r_y3": 171.7, "coord_origin": "TOPLEFT" }, "text": "$^{6960]}$, Ahmed Nassar[0000", "orig": "$^{6960]}$, Ahmed Nassar[0000", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 10, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 392.3, "r_y0": 176.3, "r_x1": 398.5, "r_y1": 176.3, "r_x2": 398.5, "r_y2": 169.7, "r_x3": 392.3, "r_y3": 169.7, "coord_origin": "TOPLEFT" }, "text": "\u2212", "orig": "\u2212", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 11, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 398.5, "r_y0": 176.3, "r_x1": 414.4, "r_y1": 176.3, "r_x2": 414.4, "r_y2": 170.1, "r_x3": 398.5, "r_y3": 170.1, "coord_origin": "TOPLEFT" }, "text": "0002", "orig": "0002", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 12, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 414.4, "r_y0": 176.3, "r_x1": 420.6, "r_y1": 176.3, "r_x2": 420.6, "r_y2": 169.7, "r_x3": 414.4, "r_y3": 169.7, "coord_origin": "TOPLEFT" }, "text": "\u2212", "orig": "\u2212", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 13, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 420.6, "r_y0": 176.3, "r_x1": 436.5, "r_y1": 176.3, "r_x2": 436.5, "r_y2": 170.1, "r_x3": 420.6, "r_y3": 170.1, "coord_origin": "TOPLEFT" }, "text": "9468", "orig": "9468", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 14, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 436.5, "r_y0": 176.3, "r_x1": 442.7, "r_y1": 176.3, "r_x2": 442.7, "r_y2": 169.7, "r_x3": 436.5, "r_y3": 169.7, "coord_origin": "TOPLEFT" }, "text": "\u2212", "orig": "\u2212", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 15, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 442.7, "r_y0": 180.5, "r_x1": 464.1, "r_y1": 180.5, "r_x2": 464.1, "r_y2": 171.7, "r_x3": 442.7, "r_y3": 171.7, "coord_origin": "TOPLEFT" }, "text": "$^{0822]}$,", "orig": "$^{0822]}$,", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 16, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 139.3, "r_y0": 192.4, "r_x1": 224.8, "r_y1": 192.4, "r_x2": 224.8, "r_y2": 183.6, "r_x3": 139.3, "r_y3": 183.6, "coord_origin": "TOPLEFT" }, "text": "Nikolaos Livathinos", "orig": "Nikolaos Livathinos", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 17, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 224.8, "r_y0": 188.2, "r_x1": 242.9, "r_y1": 188.2, "r_x2": 242.9, "r_y2": 182.0, "r_x3": 224.8, "r_y3": 182.0, "coord_origin": "TOPLEFT" }, "text": "[0000", "orig": "[0000", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 18, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 242.9, "r_y0": 188.2, "r_x1": 249.2, "r_y1": 188.2, "r_x2": 249.2, "r_y2": 181.6, "r_x3": 242.9, "r_y3": 181.6, "coord_origin": "TOPLEFT" }, "text": "\u2212", "orig": "\u2212", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 19, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 249.2, "r_y0": 188.2, "r_x1": 265.1, "r_y1": 188.2, "r_x2": 265.1, "r_y2": 182.0, "r_x3": 249.2, "r_y3": 182.0, "coord_origin": "TOPLEFT" }, "text": "0001", "orig": "0001", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 20, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 265.1, "r_y0": 188.2, "r_x1": 271.3, "r_y1": 188.2, "r_x2": 271.3, "r_y2": 181.6, "r_x3": 265.1, "r_y3": 181.6, "coord_origin": "TOPLEFT" }, "text": "\u2212", "orig": "\u2212", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 21, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 271.3, "r_y0": 188.2, "r_x1": 287.2, "r_y1": 188.2, "r_x2": 287.2, "r_y2": 182.0, "r_x3": 271.3, "r_y3": 182.0, "coord_origin": "TOPLEFT" }, "text": "8513", "orig": "8513", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 22, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 287.2, "r_y0": 188.2, "r_x1": 293.4, "r_y1": 188.2, "r_x2": 293.4, "r_y2": 181.6, "r_x3": 287.2, "r_y3": 181.6, "coord_origin": "TOPLEFT" }, "text": "\u2212", "orig": "\u2212", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 23, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 293.4, "r_y0": 192.4, "r_x1": 404.2, "r_y1": 192.4, "r_x2": 404.2, "r_y2": 183.6, "r_x3": 293.4, "r_y3": 183.6, "coord_origin": "TOPLEFT" }, "text": "$^{3491]}$, Christoph Auer[0000", "orig": "$^{3491]}$, Christoph Auer[0000", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 24, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 404.2, "r_y0": 188.2, "r_x1": 410.4, "r_y1": 188.2, "r_x2": 410.4, "r_y2": 181.6, "r_x3": 404.2, "r_y3": 181.6, "coord_origin": "TOPLEFT" }, "text": "\u2212", "orig": "\u2212", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 25, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 410.4, "r_y0": 188.2, "r_x1": 426.3, "r_y1": 188.2, "r_x2": 426.3, "r_y2": 182.0, "r_x3": 410.4, "r_y3": 182.0, "coord_origin": "TOPLEFT" }, "text": "0001", "orig": "0001", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 26, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 426.3, "r_y0": 188.2, "r_x1": 432.5, "r_y1": 188.2, "r_x2": 432.5, "r_y2": 181.6, "r_x3": 426.3, "r_y3": 181.6, "coord_origin": "TOPLEFT" }, "text": "\u2212", "orig": "\u2212", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 27, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 432.5, "r_y0": 188.2, "r_x1": 448.4, "r_y1": 188.2, "r_x2": 448.4, "r_y2": 182.0, "r_x3": 432.5, "r_y3": 182.0, "coord_origin": "TOPLEFT" }, "text": "5761", "orig": "5761", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 28, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 448.4, "r_y0": 188.2, "r_x1": 454.6, "r_y1": 188.2, "r_x2": 454.6, "r_y2": 181.6, "r_x3": 448.4, "r_y3": 181.6, "coord_origin": "TOPLEFT" }, "text": "\u2212", "orig": "\u2212", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 29, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 454.6, "r_y0": 192.4, "r_x1": 476.0, "r_y1": 192.4, "r_x2": 476.0, "r_y2": 183.6, "r_x3": 454.6, "r_y3": 183.6, "coord_origin": "TOPLEFT" }, "text": "$^{0422]}$,", "orig": "$^{0422]}$,", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 31, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 298.6, "r_y0": 200.2, "r_x1": 316.7, "r_y1": 200.2, "r_x2": 316.7, "r_y2": 194.0, "r_x3": 298.6, "r_y3": 194.0, "coord_origin": "TOPLEFT" }, "text": "[0000", "orig": "[0000", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 32, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 316.7, "r_y0": 200.2, "r_x1": 323.0, "r_y1": 200.2, "r_x2": 323.0, "r_y2": 193.6, "r_x3": 316.7, "r_y3": 193.6, "coord_origin": "TOPLEFT" }, "text": "\u2212", "orig": "\u2212", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 33, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 323.0, "r_y0": 200.2, "r_x1": 338.9, "r_y1": 200.2, "r_x2": 338.9, "r_y2": 194.0, "r_x3": 323.0, "r_y3": 194.0, "coord_origin": "TOPLEFT" }, "text": "0002", "orig": "0002", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 34, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 338.9, "r_y0": 200.2, "r_x1": 345.1, "r_y1": 200.2, "r_x2": 345.1, "r_y2": 193.6, "r_x3": 338.9, "r_y3": 193.6, "coord_origin": "TOPLEFT" }, "text": "\u2212", "orig": "\u2212", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 35, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 345.1, "r_y0": 200.2, "r_x1": 361.0, "r_y1": 200.2, "r_x2": 361.0, "r_y2": 194.0, "r_x3": 345.1, "r_y3": 194.0, "coord_origin": "TOPLEFT" }, "text": "8088", "orig": "8088", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 36, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 361.0, "r_y0": 200.2, "r_x1": 367.2, "r_y1": 200.2, "r_x2": 367.2, "r_y2": 193.6, "r_x3": 361.0, "r_y3": 193.6, "coord_origin": "TOPLEFT" }, "text": "\u2212", "orig": "\u2212", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 37, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 367.2, "r_y0": 200.2, "r_x1": 385.3, "r_y1": 200.2, "r_x2": 385.3, "r_y2": 194.0, "r_x3": 367.2, "r_y3": 194.0, "coord_origin": "TOPLEFT" }, "text": "0823]", "orig": "0823]", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 13, "label": "text", "bbox": { "l": 229.5, "t": 195.6, "r": 298.6, "b": 204.4, "coord_origin": "TOPLEFT" }, "confidence": 0.5, "cells": [ { "index": 30, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 229.5, "r_y0": 204.4, "r_x1": 298.6, "r_y1": 204.4, "r_x2": 298.6, "r_y2": 195.6, "r_x3": 229.5, "r_y3": 195.6, "coord_origin": "TOPLEFT" }, "text": "and Peter Staar", "orig": "and Peter Staar", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 9, "label": "text", "bbox": { "l": 279.1, "t": 217.2, "r": 336.3, "b": 225.3, "coord_origin": "TOPLEFT" }, "confidence": 0.63, "cells": [ { "index": 38, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 279.1, "r_y0": 225.3, "r_x1": 336.3, "r_y1": 225.3, "r_x2": 336.3, "r_y2": 217.2, "r_x3": 279.1, "r_y3": 217.2, "coord_origin": "TOPLEFT" }, "text": "IBM Research", "orig": "IBM Research", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 8, "label": "text", "bbox": { "l": 223.0, "t": 228.8, "r": 392.4, "b": 236.3, "coord_origin": "TOPLEFT" }, "confidence": 0.69, "cells": [ { "index": 39, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 223.0, "r_y0": 236.3, "r_x1": 392.4, "r_y1": 236.3, "r_x2": 392.4, "r_y2": 228.8, "r_x3": 223.0, "r_y3": 228.8, "coord_origin": "TOPLEFT" }, "text": "{mly,ahn,nli,cau,taa}@zurich.ibm.com", "orig": "{mly,ahn,nli,cau,taa}@zurich.ibm.com", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] } ] }, { "id": 1, "label": "text", "bbox": { "l": 163.1, "t": 270.3, "r": 452.2, "b": 464.7, "coord_origin": "TOPLEFT" }, "confidence": 0.98, "cells": [ { "index": 40, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 163.1, "r_y0": 278.2, "r_x1": 206.6, "r_y1": 278.2, "r_x2": 206.6, "r_y2": 270.3, "r_x3": 163.1, "r_y3": 270.3, "coord_origin": "TOPLEFT" }, "text": "Abstract.", "orig": "Abstract.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 41, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 211.6, "r_y0": 278.4, "r_x1": 452.2, "r_y1": 278.4, "r_x2": 452.2, "r_y2": 270.4, "r_x3": 211.6, "r_y3": 270.4, "coord_origin": "TOPLEFT" }, "text": "Extracting tables from documents is a crucial task in any", "orig": "Extracting tables from documents is a crucial task in any", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 42, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 163.1, "r_y0": 289.4, "r_x1": 452.2, "r_y1": 289.4, "r_x2": 452.2, "r_y2": 281.3, "r_x3": 163.1, "r_y3": 281.3, "coord_origin": "TOPLEFT" }, "text": "document conversion pipeline. Recently, transformer-based models have", "orig": "document conversion pipeline. Recently, transformer-based models have", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 43, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 163.1, "r_y0": 300.4, "r_x1": 452.2, "r_y1": 300.4, "r_x2": 452.2, "r_y2": 292.3, "r_x3": 163.1, "r_y3": 292.3, "coord_origin": "TOPLEFT" }, "text": "demonstrated that table-structure can be recognized with impressive ac-", "orig": "demonstrated that table-structure can be recognized with impressive ac-", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 44, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 163.1, "r_y0": 311.3, "r_x1": 452.2, "r_y1": 311.3, "r_x2": 452.2, "r_y2": 303.2, "r_x3": 163.1, "r_y3": 303.2, "coord_origin": "TOPLEFT" }, "text": "curacy using Image-to-Markup-Sequence (Im2Seq) approaches. Taking", "orig": "curacy using Image-to-Markup-Sequence (Im2Seq) approaches. Taking", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 45, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 163.1, "r_y0": 322.3, "r_x1": 452.2, "r_y1": 322.3, "r_x2": 452.2, "r_y2": 314.2, "r_x3": 163.1, "r_y3": 314.2, "coord_origin": "TOPLEFT" }, "text": "only the image of a table, such models predict a sequence of tokens (e.g.", "orig": "only the image of a table, such models predict a sequence of tokens (e.g.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 46, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 163.1, "r_y0": 333.2, "r_x1": 452.2, "r_y1": 333.2, "r_x2": 452.2, "r_y2": 325.2, "r_x3": 163.1, "r_y3": 325.2, "coord_origin": "TOPLEFT" }, "text": "in HTML, LaTeX) which represent the structure of the table. Since the", "orig": "in HTML, LaTeX) which represent the structure of the table. Since the", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 47, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 163.1, "r_y0": 344.2, "r_x1": 452.2, "r_y1": 344.2, "r_x2": 452.2, "r_y2": 336.1, "r_x3": 163.1, "r_y3": 336.1, "coord_origin": "TOPLEFT" }, "text": "token representation of the table structure has a significant impact on", "orig": "token representation of the table structure has a significant impact on", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 48, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 163.1, "r_y0": 355.1, "r_x1": 452.2, "r_y1": 355.1, "r_x2": 452.2, "r_y2": 347.1, "r_x3": 163.1, "r_y3": 347.1, "coord_origin": "TOPLEFT" }, "text": "the accuracy and run-time performance of any Im2Seq model, we inves-", "orig": "the accuracy and run-time performance of any Im2Seq model, we inves-", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 49, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 163.1, "r_y0": 366.1, "r_x1": 452.2, "r_y1": 366.1, "r_x2": 452.2, "r_y2": 358.0, "r_x3": 163.1, "r_y3": 358.0, "coord_origin": "TOPLEFT" }, "text": "tigate in this paper how table-structure representation can be optimised.", "orig": "tigate in this paper how table-structure representation can be optimised.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 50, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 163.1, "r_y0": 377.1, "r_x1": 452.2, "r_y1": 377.1, "r_x2": 452.2, "r_y2": 369.0, "r_x3": 163.1, "r_y3": 369.0, "coord_origin": "TOPLEFT" }, "text": "We propose a new, optimised table-structure language (OTSL) with a", "orig": "We propose a new, optimised table-structure language (OTSL) with a", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 51, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 163.1, "r_y0": 388.0, "r_x1": 452.2, "r_y1": 388.0, "r_x2": 452.2, "r_y2": 380.0, "r_x3": 163.1, "r_y3": 380.0, "coord_origin": "TOPLEFT" }, "text": "minimized vocabulary and specific rules. The benefits of OTSL are that", "orig": "minimized vocabulary and specific rules. The benefits of OTSL are that", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 52, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 163.1, "r_y0": 399.0, "r_x1": 452.2, "r_y1": 399.0, "r_x2": 452.2, "r_y2": 390.9, "r_x3": 163.1, "r_y3": 390.9, "coord_origin": "TOPLEFT" }, "text": "it reduces the number of tokens to 5 (HTML needs 28+) and shortens", "orig": "it reduces the number of tokens to 5 (HTML needs 28+) and shortens", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 53, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 163.1, "r_y0": 409.9, "r_x1": 452.2, "r_y1": 409.9, "r_x2": 452.2, "r_y2": 401.9, "r_x3": 163.1, "r_y3": 401.9, "coord_origin": "TOPLEFT" }, "text": "the sequence length to half of HTML on average. Consequently, model", "orig": "the sequence length to half of HTML on average. Consequently, model", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 54, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 163.1, "r_y0": 420.9, "r_x1": 452.2, "r_y1": 420.9, "r_x2": 452.2, "r_y2": 412.8, "r_x3": 163.1, "r_y3": 412.8, "coord_origin": "TOPLEFT" }, "text": "accuracy improves significantly, inference time is halved compared to", "orig": "accuracy improves significantly, inference time is halved compared to", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 55, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 163.1, "r_y0": 431.9, "r_x1": 452.2, "r_y1": 431.9, "r_x2": 452.2, "r_y2": 423.8, "r_x3": 163.1, "r_y3": 423.8, "coord_origin": "TOPLEFT" }, "text": "HTML-based models, and the predicted table structures are always syn-", "orig": "HTML-based models, and the predicted table structures are always syn-", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 56, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 163.1, "r_y0": 442.8, "r_x1": 452.2, "r_y1": 442.8, "r_x2": 452.2, "r_y2": 434.7, "r_x3": 163.1, "r_y3": 434.7, "coord_origin": "TOPLEFT" }, "text": "tactically correct. This in turn eliminates most post-processing needs.", "orig": "tactically correct. This in turn eliminates most post-processing needs.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 57, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 163.1, "r_y0": 453.8, "r_x1": 452.2, "r_y1": 453.8, "r_x2": 452.2, "r_y2": 445.7, "r_x3": 163.1, "r_y3": 445.7, "coord_origin": "TOPLEFT" }, "text": "Popular table structure data-sets will be published in OTSL format to", "orig": "Popular table structure data-sets will be published in OTSL format to", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 58, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 163.1, "r_y0": 464.7, "r_x1": 225.6, "r_y1": 464.7, "r_x2": 225.6, "r_y2": 456.7, "r_x3": 163.1, "r_y3": 456.7, "coord_origin": "TOPLEFT" }, "text": "the community.", "orig": "the community.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 4, "label": "text", "bbox": { "l": 163.1, "t": 478.7, "r": 452.2, "b": 497.8, "coord_origin": "TOPLEFT" }, "confidence": 0.93, "cells": [ { "index": 59, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 163.1, "r_y0": 486.6, "r_x1": 211.9, "r_y1": 486.6, "r_x2": 211.9, "r_y2": 478.7, "r_x3": 163.1, "r_y3": 478.7, "coord_origin": "TOPLEFT" }, "text": "Keywords:", "orig": "Keywords:", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 60, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 216.6, "r_y0": 486.8, "r_x1": 452.2, "r_y1": 486.8, "r_x2": 452.2, "r_y2": 478.8, "r_x3": 216.6, "r_y3": 478.8, "coord_origin": "TOPLEFT" }, "text": "Table Structure Recognition \u00b7 Data Representation \u00b7 Trans-", "orig": "Table Structure Recognition \u00b7 Data Representation \u00b7 Trans-", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 61, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 163.1, "r_y0": 497.8, "r_x1": 257.6, "r_y1": 497.8, "r_x2": 257.6, "r_y2": 489.7, "r_x3": 163.1, "r_y3": 489.7, "coord_origin": "TOPLEFT" }, "text": "formers \u00b7 Optimization.", "orig": "formers \u00b7 Optimization.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 3, "label": "section_header", "bbox": { "l": 134.8, "t": 522.1, "r": 228.9, "b": 532.7, "coord_origin": "TOPLEFT" }, "confidence": 0.94, "cells": [ { "index": 62, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 134.8, "r_y0": 532.7, "r_x1": 141.5, "r_y1": 532.7, "r_x2": 141.5, "r_y2": 522.1, "r_x3": 134.8, "r_y3": 522.1, "coord_origin": "TOPLEFT" }, "text": "1", "orig": "1", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 63, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 154.9, "r_y0": 532.7, "r_x1": 228.9, "r_y1": 532.7, "r_x2": 228.9, "r_y2": 522.1, "r_x3": 154.9, "r_y3": 522.1, "coord_origin": "TOPLEFT" }, "text": "Introduction", "orig": "Introduction", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 0, "label": "text", "bbox": { "l": 134.8, "t": 548.3, "r": 480.6, "b": 628.8, "coord_origin": "TOPLEFT" }, "confidence": 0.98, "cells": [ { "index": 64, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 134.8, "r_y0": 557.1, "r_x1": 480.6, "r_y1": 557.1, "r_x2": 480.6, "r_y2": 548.3, "r_x3": 134.8, "r_y3": 548.3, "coord_origin": "TOPLEFT" }, "text": "Tables are ubiquitous in documents such as scientific papers, patents, reports,", "orig": "Tables are ubiquitous in documents such as scientific papers, patents, reports,", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 65, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 134.8, "r_y0": 569.0, "r_x1": 480.6, "r_y1": 569.0, "r_x2": 480.6, "r_y2": 560.2, "r_x3": 134.8, "r_y3": 560.2, "coord_origin": "TOPLEFT" }, "text": "manuals, specification sheets or marketing material. They often encode highly", "orig": "manuals, specification sheets or marketing material. They often encode highly", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 66, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 134.8, "r_y0": 581.0, "r_x1": 480.6, "r_y1": 581.0, "r_x2": 480.6, "r_y2": 572.2, "r_x3": 134.8, "r_y3": 572.2, "coord_origin": "TOPLEFT" }, "text": "valuable information and therefore need to be extracted with high accuracy.", "orig": "valuable information and therefore need to be extracted with high accuracy.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 67, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 134.8, "r_y0": 592.9, "r_x1": 480.6, "r_y1": 592.9, "r_x2": 480.6, "r_y2": 584.2, "r_x3": 134.8, "r_y3": 584.2, "coord_origin": "TOPLEFT" }, "text": "Unfortunately, tables appear in documents in various sizes, styling and struc-", "orig": "Unfortunately, tables appear in documents in various sizes, styling and struc-", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 68, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 134.8, "r_y0": 604.9, "r_x1": 480.6, "r_y1": 604.9, "r_x2": 480.6, "r_y2": 596.1, "r_x3": 134.8, "r_y3": 596.1, "coord_origin": "TOPLEFT" }, "text": "ture, making it difficult to recover their correct structure with simple analyt-", "orig": "ture, making it difficult to recover their correct structure with simple analyt-", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 69, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 134.8, "r_y0": 616.9, "r_x1": 480.6, "r_y1": 616.9, "r_x2": 480.6, "r_y2": 608.1, "r_x3": 134.8, "r_y3": 608.1, "coord_origin": "TOPLEFT" }, "text": "ical methods. Therefore, accurate table extraction is achieved these days with", "orig": "ical methods. Therefore, accurate table extraction is achieved these days with", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 70, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 134.8, "r_y0": 628.8, "r_x1": 279.3, "r_y1": 628.8, "r_x2": 279.3, "r_y2": 620.0, "r_x3": 134.8, "r_y3": 620.0, "coord_origin": "TOPLEFT" }, "text": "machine-learning based methods.", "orig": "machine-learning based methods.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 2, "label": "text", "bbox": { "l": 134.8, "t": 632.1, "r": 480.6, "b": 664.9, "coord_origin": "TOPLEFT" }, "confidence": 0.97, "cells": [ { "index": 71, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 149.7, "r_y0": 640.9, "r_x1": 480.6, "r_y1": 640.9, "r_x2": 480.6, "r_y2": 632.1, "r_x3": 149.7, "r_y3": 632.1, "coord_origin": "TOPLEFT" }, "text": "In modern document understanding systems [1,15], table extraction is typi-", "orig": "In modern document understanding systems [1,15], table extraction is typi-", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 72, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 134.8, "r_y0": 652.9, "r_x1": 480.6, "r_y1": 652.9, "r_x2": 480.6, "r_y2": 644.1, "r_x3": 134.8, "r_y3": 644.1, "coord_origin": "TOPLEFT" }, "text": "cally a two-step process. Firstly, every table on a page is located with a bounding", "orig": "cally a two-step process. Firstly, every table on a page is located with a bounding", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 73, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 134.8, "r_y0": 664.9, "r_x1": 480.6, "r_y1": 664.9, "r_x2": 480.6, "r_y2": 656.1, "r_x3": 134.8, "r_y3": 656.1, "coord_origin": "TOPLEFT" }, "text": "box, and secondly, their logical row and column structure is recognized. As of", "orig": "box, and secondly, their logical row and column structure is recognized. As of", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 6, "label": "page_header", "bbox": { "l": 18.3, "t": 209.5, "r": 36.3, "b": 555.0, "coord_origin": "TOPLEFT" }, "confidence": 0.89, "cells": [ { "index": 74, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 18.3, "r_y0": 555.0, "r_x1": 36.3, "r_y1": 555.0, "r_x2": 36.3, "r_y2": 209.5, "r_x3": 18.3, "r_y3": 209.5, "coord_origin": "TOPLEFT" }, "text": "arXiv:2305.03393v1 [cs.CV] 5 May 2023", "orig": "arXiv:2305.03393v1 [cs.CV] 5 May 2023", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] } ] }, "tablestructure": { "table_map": {} }, "figures_classification": null, "equations_prediction": null, "vlm_response": null }, "assembled": { "elements": [ { "label": "section_header", "id": 5, "page_no": 0, "cluster": { "id": 5, "label": "section_header", "bbox": { "l": 134.8, "t": 115.9, "r": 480.6, "b": 146.5, "coord_origin": "TOPLEFT" }, "confidence": 0.89, "cells": [ { "index": 0, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 134.8, "r_y0": 128.6, "r_x1": 480.6, "r_y1": 128.6, "r_x2": 480.6, "r_y2": 115.9, "r_x3": 134.8, "r_y3": 115.9, "coord_origin": "TOPLEFT" }, "text": "Optimized Table Tokenization for Table Structure", "orig": "Optimized Table Tokenization for Table Structure", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 1, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 266.7, "r_y0": 146.5, "r_x1": 348.7, "r_y1": 146.5, "r_x2": 348.7, "r_y2": 133.8, "r_x3": 266.7, "r_y3": 133.8, "coord_origin": "TOPLEFT" }, "text": "Recognition", "orig": "Recognition", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, "text": "Optimized Table Tokenization for Table Structure Recognition" }, { "label": "key_value_region", "id": 16, "page_no": 0, "cluster": { "id": 16, "label": "key_value_region", "bbox": { "l": 139.3, "t": 169.7, "r": 476.0, "b": 236.3, "coord_origin": "TOPLEFT" }, "confidence": 0.48, "cells": [ { "index": 2, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 151.2, "r_y0": 180.5, "r_x1": 217.0, "r_y1": 180.5, "r_x2": 217.0, "r_y2": 171.7, "r_x3": 151.2, "r_y3": 171.7, "coord_origin": "TOPLEFT" }, "text": "Maksym Lysak", "orig": "Maksym Lysak", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 3, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 217.0, "r_y0": 176.3, "r_x1": 235.2, "r_y1": 176.3, "r_x2": 235.2, "r_y2": 170.1, "r_x3": 217.0, "r_y3": 170.1, "coord_origin": "TOPLEFT" }, "text": "[0000", "orig": "[0000", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 4, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 235.2, "r_y0": 176.3, "r_x1": 241.4, "r_y1": 176.3, "r_x2": 241.4, "r_y2": 169.7, "r_x3": 235.2, "r_y3": 169.7, "coord_origin": "TOPLEFT" }, "text": "\u2212", "orig": "\u2212", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 5, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 241.4, "r_y0": 176.3, "r_x1": 257.3, "r_y1": 176.3, "r_x2": 257.3, "r_y2": 170.1, "r_x3": 241.4, "r_y3": 170.1, "coord_origin": "TOPLEFT" }, "text": "0002", "orig": "0002", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 6, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 257.3, "r_y0": 176.3, "r_x1": 263.5, "r_y1": 176.3, "r_x2": 263.5, "r_y2": 169.7, "r_x3": 257.3, "r_y3": 169.7, "coord_origin": "TOPLEFT" }, "text": "\u2212", "orig": "\u2212", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 7, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 263.5, "r_y0": 176.3, "r_x1": 279.4, "r_y1": 176.3, "r_x2": 279.4, "r_y2": 170.1, "r_x3": 263.5, "r_y3": 170.1, "coord_origin": "TOPLEFT" }, "text": "3723", "orig": "3723", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 8, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 279.4, "r_y0": 176.3, "r_x1": 285.6, "r_y1": 176.3, "r_x2": 285.6, "r_y2": 169.7, "r_x3": 279.4, "r_y3": 169.7, "coord_origin": "TOPLEFT" }, "text": "\u2212", "orig": "\u2212", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 9, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 285.6, "r_y0": 180.5, "r_x1": 392.3, "r_y1": 180.5, "r_x2": 392.3, "r_y2": 171.7, "r_x3": 285.6, "r_y3": 171.7, "coord_origin": "TOPLEFT" }, "text": "$^{6960]}$, Ahmed Nassar[0000", "orig": "$^{6960]}$, Ahmed Nassar[0000", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 10, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 392.3, "r_y0": 176.3, "r_x1": 398.5, "r_y1": 176.3, "r_x2": 398.5, "r_y2": 169.7, "r_x3": 392.3, "r_y3": 169.7, "coord_origin": "TOPLEFT" }, "text": "\u2212", "orig": "\u2212", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 11, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 398.5, "r_y0": 176.3, "r_x1": 414.4, "r_y1": 176.3, "r_x2": 414.4, "r_y2": 170.1, "r_x3": 398.5, "r_y3": 170.1, "coord_origin": "TOPLEFT" }, "text": "0002", "orig": "0002", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 12, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 414.4, "r_y0": 176.3, "r_x1": 420.6, "r_y1": 176.3, "r_x2": 420.6, "r_y2": 169.7, "r_x3": 414.4, "r_y3": 169.7, "coord_origin": "TOPLEFT" }, "text": "\u2212", "orig": "\u2212", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 13, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 420.6, "r_y0": 176.3, "r_x1": 436.5, "r_y1": 176.3, "r_x2": 436.5, "r_y2": 170.1, "r_x3": 420.6, "r_y3": 170.1, "coord_origin": "TOPLEFT" }, "text": "9468", "orig": "9468", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 14, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 436.5, "r_y0": 176.3, "r_x1": 442.7, "r_y1": 176.3, "r_x2": 442.7, "r_y2": 169.7, "r_x3": 436.5, "r_y3": 169.7, "coord_origin": "TOPLEFT" }, "text": "\u2212", "orig": "\u2212", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 15, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 442.7, "r_y0": 180.5, "r_x1": 464.1, "r_y1": 180.5, "r_x2": 464.1, "r_y2": 171.7, "r_x3": 442.7, "r_y3": 171.7, "coord_origin": "TOPLEFT" }, "text": "$^{0822]}$,", "orig": "$^{0822]}$,", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 16, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 139.3, "r_y0": 192.4, "r_x1": 224.8, "r_y1": 192.4, "r_x2": 224.8, "r_y2": 183.6, "r_x3": 139.3, "r_y3": 183.6, "coord_origin": "TOPLEFT" }, "text": "Nikolaos Livathinos", "orig": "Nikolaos Livathinos", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 17, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 224.8, "r_y0": 188.2, "r_x1": 242.9, "r_y1": 188.2, "r_x2": 242.9, "r_y2": 182.0, "r_x3": 224.8, "r_y3": 182.0, "coord_origin": "TOPLEFT" }, "text": "[0000", "orig": "[0000", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 18, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 242.9, "r_y0": 188.2, "r_x1": 249.2, "r_y1": 188.2, "r_x2": 249.2, "r_y2": 181.6, "r_x3": 242.9, "r_y3": 181.6, "coord_origin": "TOPLEFT" }, "text": "\u2212", "orig": "\u2212", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 19, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 249.2, "r_y0": 188.2, "r_x1": 265.1, "r_y1": 188.2, "r_x2": 265.1, "r_y2": 182.0, "r_x3": 249.2, "r_y3": 182.0, "coord_origin": "TOPLEFT" }, "text": "0001", "orig": "0001", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 20, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 265.1, "r_y0": 188.2, "r_x1": 271.3, "r_y1": 188.2, "r_x2": 271.3, "r_y2": 181.6, "r_x3": 265.1, "r_y3": 181.6, "coord_origin": "TOPLEFT" }, "text": "\u2212", "orig": "\u2212", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 21, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 271.3, "r_y0": 188.2, "r_x1": 287.2, "r_y1": 188.2, "r_x2": 287.2, "r_y2": 182.0, "r_x3": 271.3, "r_y3": 182.0, "coord_origin": "TOPLEFT" }, "text": "8513", "orig": "8513", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 22, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 287.2, "r_y0": 188.2, "r_x1": 293.4, "r_y1": 188.2, "r_x2": 293.4, "r_y2": 181.6, "r_x3": 287.2, "r_y3": 181.6, "coord_origin": "TOPLEFT" }, "text": "\u2212", "orig": "\u2212", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 23, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 293.4, "r_y0": 192.4, "r_x1": 404.2, "r_y1": 192.4, "r_x2": 404.2, "r_y2": 183.6, "r_x3": 293.4, "r_y3": 183.6, "coord_origin": "TOPLEFT" }, "text": "$^{3491]}$, Christoph Auer[0000", "orig": "$^{3491]}$, Christoph Auer[0000", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 24, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 404.2, "r_y0": 188.2, "r_x1": 410.4, "r_y1": 188.2, "r_x2": 410.4, "r_y2": 181.6, "r_x3": 404.2, "r_y3": 181.6, "coord_origin": "TOPLEFT" }, "text": "\u2212", "orig": "\u2212", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 25, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 410.4, "r_y0": 188.2, "r_x1": 426.3, "r_y1": 188.2, "r_x2": 426.3, "r_y2": 182.0, "r_x3": 410.4, "r_y3": 182.0, "coord_origin": "TOPLEFT" }, "text": "0001", "orig": "0001", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 26, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 426.3, "r_y0": 188.2, "r_x1": 432.5, "r_y1": 188.2, "r_x2": 432.5, "r_y2": 181.6, "r_x3": 426.3, "r_y3": 181.6, "coord_origin": "TOPLEFT" }, "text": "\u2212", "orig": "\u2212", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 27, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 432.5, "r_y0": 188.2, "r_x1": 448.4, "r_y1": 188.2, "r_x2": 448.4, "r_y2": 182.0, "r_x3": 432.5, "r_y3": 182.0, "coord_origin": "TOPLEFT" }, "text": "5761", "orig": "5761", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 28, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 448.4, "r_y0": 188.2, "r_x1": 454.6, "r_y1": 188.2, "r_x2": 454.6, "r_y2": 181.6, "r_x3": 448.4, "r_y3": 181.6, "coord_origin": "TOPLEFT" }, "text": "\u2212", "orig": "\u2212", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 29, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 454.6, "r_y0": 192.4, "r_x1": 476.0, "r_y1": 192.4, "r_x2": 476.0, "r_y2": 183.6, "r_x3": 454.6, "r_y3": 183.6, "coord_origin": "TOPLEFT" }, "text": "$^{0422]}$,", "orig": "$^{0422]}$,", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 30, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 229.5, "r_y0": 204.4, "r_x1": 298.6, "r_y1": 204.4, "r_x2": 298.6, "r_y2": 195.6, "r_x3": 229.5, "r_y3": 195.6, "coord_origin": "TOPLEFT" }, "text": "and Peter Staar", "orig": "and Peter Staar", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 31, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 298.6, "r_y0": 200.2, "r_x1": 316.7, "r_y1": 200.2, "r_x2": 316.7, "r_y2": 194.0, "r_x3": 298.6, "r_y3": 194.0, "coord_origin": "TOPLEFT" }, "text": "[0000", "orig": "[0000", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 32, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 316.7, "r_y0": 200.2, "r_x1": 323.0, "r_y1": 200.2, "r_x2": 323.0, "r_y2": 193.6, "r_x3": 316.7, "r_y3": 193.6, "coord_origin": "TOPLEFT" }, "text": "\u2212", "orig": "\u2212", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 33, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 323.0, "r_y0": 200.2, "r_x1": 338.9, "r_y1": 200.2, "r_x2": 338.9, "r_y2": 194.0, "r_x3": 323.0, "r_y3": 194.0, "coord_origin": "TOPLEFT" }, "text": "0002", "orig": "0002", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 34, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 338.9, "r_y0": 200.2, "r_x1": 345.1, "r_y1": 200.2, "r_x2": 345.1, "r_y2": 193.6, "r_x3": 338.9, "r_y3": 193.6, "coord_origin": "TOPLEFT" }, "text": "\u2212", "orig": "\u2212", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 35, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 345.1, "r_y0": 200.2, "r_x1": 361.0, "r_y1": 200.2, "r_x2": 361.0, "r_y2": 194.0, "r_x3": 345.1, "r_y3": 194.0, "coord_origin": "TOPLEFT" }, "text": "8088", "orig": "8088", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 36, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 361.0, "r_y0": 200.2, "r_x1": 367.2, "r_y1": 200.2, "r_x2": 367.2, "r_y2": 193.6, "r_x3": 361.0, "r_y3": 193.6, "coord_origin": "TOPLEFT" }, "text": "\u2212", "orig": "\u2212", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 37, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 367.2, "r_y0": 200.2, "r_x1": 385.3, "r_y1": 200.2, "r_x2": 385.3, "r_y2": 194.0, "r_x3": 367.2, "r_y3": 194.0, "coord_origin": "TOPLEFT" }, "text": "0823]", "orig": "0823]", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 38, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 279.1, "r_y0": 225.3, "r_x1": 336.3, "r_y1": 225.3, "r_x2": 336.3, "r_y2": 217.2, "r_x3": 279.1, "r_y3": 217.2, "coord_origin": "TOPLEFT" }, "text": "IBM Research", "orig": "IBM Research", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 39, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 223.0, "r_y0": 236.3, "r_x1": 392.4, "r_y1": 236.3, "r_x2": 392.4, "r_y2": 228.8, "r_x3": 223.0, "r_y3": 228.8, "coord_origin": "TOPLEFT" }, "text": "{mly,ahn,nli,cau,taa}@zurich.ibm.com", "orig": "{mly,ahn,nli,cau,taa}@zurich.ibm.com", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [ { "id": 7, "label": "text", "bbox": { "l": 139.3, "t": 169.7, "r": 476.0, "b": 200.2, "coord_origin": "TOPLEFT" }, "confidence": 0.79, "cells": [ { "index": 2, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 151.2, "r_y0": 180.5, "r_x1": 217.0, "r_y1": 180.5, "r_x2": 217.0, "r_y2": 171.7, "r_x3": 151.2, "r_y3": 171.7, "coord_origin": "TOPLEFT" }, "text": "Maksym Lysak", "orig": "Maksym Lysak", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 3, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 217.0, "r_y0": 176.3, "r_x1": 235.2, "r_y1": 176.3, "r_x2": 235.2, "r_y2": 170.1, "r_x3": 217.0, "r_y3": 170.1, "coord_origin": "TOPLEFT" }, "text": "[0000", "orig": "[0000", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 4, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 235.2, "r_y0": 176.3, "r_x1": 241.4, "r_y1": 176.3, "r_x2": 241.4, "r_y2": 169.7, "r_x3": 235.2, "r_y3": 169.7, "coord_origin": "TOPLEFT" }, "text": "\u2212", "orig": "\u2212", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 5, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 241.4, "r_y0": 176.3, "r_x1": 257.3, "r_y1": 176.3, "r_x2": 257.3, "r_y2": 170.1, "r_x3": 241.4, "r_y3": 170.1, "coord_origin": "TOPLEFT" }, "text": "0002", "orig": "0002", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 6, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 257.3, "r_y0": 176.3, "r_x1": 263.5, "r_y1": 176.3, "r_x2": 263.5, "r_y2": 169.7, "r_x3": 257.3, "r_y3": 169.7, "coord_origin": "TOPLEFT" }, "text": "\u2212", "orig": "\u2212", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 7, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 263.5, "r_y0": 176.3, "r_x1": 279.4, "r_y1": 176.3, "r_x2": 279.4, "r_y2": 170.1, "r_x3": 263.5, "r_y3": 170.1, "coord_origin": "TOPLEFT" }, "text": "3723", "orig": "3723", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 8, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 279.4, "r_y0": 176.3, "r_x1": 285.6, "r_y1": 176.3, "r_x2": 285.6, "r_y2": 169.7, "r_x3": 279.4, "r_y3": 169.7, "coord_origin": "TOPLEFT" }, "text": "\u2212", "orig": "\u2212", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 9, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 285.6, "r_y0": 180.5, "r_x1": 392.3, "r_y1": 180.5, "r_x2": 392.3, "r_y2": 171.7, "r_x3": 285.6, "r_y3": 171.7, "coord_origin": "TOPLEFT" }, "text": "$^{6960]}$, Ahmed Nassar[0000", "orig": "$^{6960]}$, Ahmed Nassar[0000", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 10, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 392.3, "r_y0": 176.3, "r_x1": 398.5, "r_y1": 176.3, "r_x2": 398.5, "r_y2": 169.7, "r_x3": 392.3, "r_y3": 169.7, "coord_origin": "TOPLEFT" }, "text": "\u2212", "orig": "\u2212", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 11, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 398.5, "r_y0": 176.3, "r_x1": 414.4, "r_y1": 176.3, "r_x2": 414.4, "r_y2": 170.1, "r_x3": 398.5, "r_y3": 170.1, "coord_origin": "TOPLEFT" }, "text": "0002", "orig": "0002", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 12, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 414.4, "r_y0": 176.3, "r_x1": 420.6, "r_y1": 176.3, "r_x2": 420.6, "r_y2": 169.7, "r_x3": 414.4, "r_y3": 169.7, "coord_origin": "TOPLEFT" }, "text": "\u2212", "orig": "\u2212", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 13, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 420.6, "r_y0": 176.3, "r_x1": 436.5, "r_y1": 176.3, "r_x2": 436.5, "r_y2": 170.1, "r_x3": 420.6, "r_y3": 170.1, "coord_origin": "TOPLEFT" }, "text": "9468", "orig": "9468", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 14, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 436.5, "r_y0": 176.3, "r_x1": 442.7, "r_y1": 176.3, "r_x2": 442.7, "r_y2": 169.7, "r_x3": 436.5, "r_y3": 169.7, "coord_origin": "TOPLEFT" }, "text": "\u2212", "orig": "\u2212", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 15, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 442.7, "r_y0": 180.5, "r_x1": 464.1, "r_y1": 180.5, "r_x2": 464.1, "r_y2": 171.7, "r_x3": 442.7, "r_y3": 171.7, "coord_origin": "TOPLEFT" }, "text": "$^{0822]}$,", "orig": "$^{0822]}$,", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 16, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 139.3, "r_y0": 192.4, "r_x1": 224.8, "r_y1": 192.4, "r_x2": 224.8, "r_y2": 183.6, "r_x3": 139.3, "r_y3": 183.6, "coord_origin": "TOPLEFT" }, "text": "Nikolaos Livathinos", "orig": "Nikolaos Livathinos", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 17, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 224.8, "r_y0": 188.2, "r_x1": 242.9, "r_y1": 188.2, "r_x2": 242.9, "r_y2": 182.0, "r_x3": 224.8, "r_y3": 182.0, "coord_origin": "TOPLEFT" }, "text": "[0000", "orig": "[0000", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 18, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 242.9, "r_y0": 188.2, "r_x1": 249.2, "r_y1": 188.2, "r_x2": 249.2, "r_y2": 181.6, "r_x3": 242.9, "r_y3": 181.6, "coord_origin": "TOPLEFT" }, "text": "\u2212", "orig": "\u2212", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 19, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 249.2, "r_y0": 188.2, "r_x1": 265.1, "r_y1": 188.2, "r_x2": 265.1, "r_y2": 182.0, "r_x3": 249.2, "r_y3": 182.0, "coord_origin": "TOPLEFT" }, "text": "0001", "orig": "0001", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 20, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 265.1, "r_y0": 188.2, "r_x1": 271.3, "r_y1": 188.2, "r_x2": 271.3, "r_y2": 181.6, "r_x3": 265.1, "r_y3": 181.6, "coord_origin": "TOPLEFT" }, "text": "\u2212", "orig": "\u2212", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 21, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 271.3, "r_y0": 188.2, "r_x1": 287.2, "r_y1": 188.2, "r_x2": 287.2, "r_y2": 182.0, "r_x3": 271.3, "r_y3": 182.0, "coord_origin": "TOPLEFT" }, "text": "8513", "orig": "8513", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 22, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 287.2, "r_y0": 188.2, "r_x1": 293.4, "r_y1": 188.2, "r_x2": 293.4, "r_y2": 181.6, "r_x3": 287.2, "r_y3": 181.6, "coord_origin": "TOPLEFT" }, "text": "\u2212", "orig": "\u2212", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 23, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 293.4, "r_y0": 192.4, "r_x1": 404.2, "r_y1": 192.4, "r_x2": 404.2, "r_y2": 183.6, "r_x3": 293.4, "r_y3": 183.6, "coord_origin": "TOPLEFT" }, "text": "$^{3491]}$, Christoph Auer[0000", "orig": "$^{3491]}$, Christoph Auer[0000", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 24, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 404.2, "r_y0": 188.2, "r_x1": 410.4, "r_y1": 188.2, "r_x2": 410.4, "r_y2": 181.6, "r_x3": 404.2, "r_y3": 181.6, "coord_origin": "TOPLEFT" }, "text": "\u2212", "orig": "\u2212", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 25, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 410.4, "r_y0": 188.2, "r_x1": 426.3, "r_y1": 188.2, "r_x2": 426.3, "r_y2": 182.0, "r_x3": 410.4, "r_y3": 182.0, "coord_origin": "TOPLEFT" }, "text": "0001", "orig": "0001", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 26, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 426.3, "r_y0": 188.2, "r_x1": 432.5, "r_y1": 188.2, "r_x2": 432.5, "r_y2": 181.6, "r_x3": 426.3, "r_y3": 181.6, "coord_origin": "TOPLEFT" }, "text": "\u2212", "orig": "\u2212", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 27, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 432.5, "r_y0": 188.2, "r_x1": 448.4, "r_y1": 188.2, "r_x2": 448.4, "r_y2": 182.0, "r_x3": 432.5, "r_y3": 182.0, "coord_origin": "TOPLEFT" }, "text": "5761", "orig": "5761", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 28, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 448.4, "r_y0": 188.2, "r_x1": 454.6, "r_y1": 188.2, "r_x2": 454.6, "r_y2": 181.6, "r_x3": 448.4, "r_y3": 181.6, "coord_origin": "TOPLEFT" }, "text": "\u2212", "orig": "\u2212", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 29, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 454.6, "r_y0": 192.4, "r_x1": 476.0, "r_y1": 192.4, "r_x2": 476.0, "r_y2": 183.6, "r_x3": 454.6, "r_y3": 183.6, "coord_origin": "TOPLEFT" }, "text": "$^{0422]}$,", "orig": "$^{0422]}$,", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 31, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 298.6, "r_y0": 200.2, "r_x1": 316.7, "r_y1": 200.2, "r_x2": 316.7, "r_y2": 194.0, "r_x3": 298.6, "r_y3": 194.0, "coord_origin": "TOPLEFT" }, "text": "[0000", "orig": "[0000", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 32, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 316.7, "r_y0": 200.2, "r_x1": 323.0, "r_y1": 200.2, "r_x2": 323.0, "r_y2": 193.6, "r_x3": 316.7, "r_y3": 193.6, "coord_origin": "TOPLEFT" }, "text": "\u2212", "orig": "\u2212", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 33, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 323.0, "r_y0": 200.2, "r_x1": 338.9, "r_y1": 200.2, "r_x2": 338.9, "r_y2": 194.0, "r_x3": 323.0, "r_y3": 194.0, "coord_origin": "TOPLEFT" }, "text": "0002", "orig": "0002", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 34, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 338.9, "r_y0": 200.2, "r_x1": 345.1, "r_y1": 200.2, "r_x2": 345.1, "r_y2": 193.6, "r_x3": 338.9, "r_y3": 193.6, "coord_origin": "TOPLEFT" }, "text": "\u2212", "orig": "\u2212", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 35, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 345.1, "r_y0": 200.2, "r_x1": 361.0, "r_y1": 200.2, "r_x2": 361.0, "r_y2": 194.0, "r_x3": 345.1, "r_y3": 194.0, "coord_origin": "TOPLEFT" }, "text": "8088", "orig": "8088", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 36, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 361.0, "r_y0": 200.2, "r_x1": 367.2, "r_y1": 200.2, "r_x2": 367.2, "r_y2": 193.6, "r_x3": 361.0, "r_y3": 193.6, "coord_origin": "TOPLEFT" }, "text": "\u2212", "orig": "\u2212", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 37, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 367.2, "r_y0": 200.2, "r_x1": 385.3, "r_y1": 200.2, "r_x2": 385.3, "r_y2": 194.0, "r_x3": 367.2, "r_y3": 194.0, "coord_origin": "TOPLEFT" }, "text": "0823]", "orig": "0823]", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 13, "label": "text", "bbox": { "l": 229.5, "t": 195.6, "r": 298.6, "b": 204.4, "coord_origin": "TOPLEFT" }, "confidence": 0.5, "cells": [ { "index": 30, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 229.5, "r_y0": 204.4, "r_x1": 298.6, "r_y1": 204.4, "r_x2": 298.6, "r_y2": 195.6, "r_x3": 229.5, "r_y3": 195.6, "coord_origin": "TOPLEFT" }, "text": "and Peter Staar", "orig": "and Peter Staar", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 9, "label": "text", "bbox": { "l": 279.1, "t": 217.2, "r": 336.3, "b": 225.3, "coord_origin": "TOPLEFT" }, "confidence": 0.63, "cells": [ { "index": 38, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 279.1, "r_y0": 225.3, "r_x1": 336.3, "r_y1": 225.3, "r_x2": 336.3, "r_y2": 217.2, "r_x3": 279.1, "r_y3": 217.2, "coord_origin": "TOPLEFT" }, "text": "IBM Research", "orig": "IBM Research", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 8, "label": "text", "bbox": { "l": 223.0, "t": 228.8, "r": 392.4, "b": 236.3, "coord_origin": "TOPLEFT" }, "confidence": 0.69, "cells": [ { "index": 39, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 223.0, "r_y0": 236.3, "r_x1": 392.4, "r_y1": 236.3, "r_x2": 392.4, "r_y2": 228.8, "r_x3": 223.0, "r_y3": 228.8, "coord_origin": "TOPLEFT" }, "text": "{mly,ahn,nli,cau,taa}@zurich.ibm.com", "orig": "{mly,ahn,nli,cau,taa}@zurich.ibm.com", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] } ] }, "text": null }, { "label": "text", "id": 1, "page_no": 0, "cluster": { "id": 1, "label": "text", "bbox": { "l": 163.1, "t": 270.3, "r": 452.2, "b": 464.7, "coord_origin": "TOPLEFT" }, "confidence": 0.98, "cells": [ { "index": 40, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 163.1, "r_y0": 278.2, "r_x1": 206.6, "r_y1": 278.2, "r_x2": 206.6, "r_y2": 270.3, "r_x3": 163.1, "r_y3": 270.3, "coord_origin": "TOPLEFT" }, "text": "Abstract.", "orig": "Abstract.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 41, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 211.6, "r_y0": 278.4, "r_x1": 452.2, "r_y1": 278.4, "r_x2": 452.2, "r_y2": 270.4, "r_x3": 211.6, "r_y3": 270.4, "coord_origin": "TOPLEFT" }, "text": "Extracting tables from documents is a crucial task in any", "orig": "Extracting tables from documents is a crucial task in any", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 42, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 163.1, "r_y0": 289.4, "r_x1": 452.2, "r_y1": 289.4, "r_x2": 452.2, "r_y2": 281.3, "r_x3": 163.1, "r_y3": 281.3, "coord_origin": "TOPLEFT" }, "text": "document conversion pipeline. Recently, transformer-based models have", "orig": "document conversion pipeline. Recently, transformer-based models have", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 43, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 163.1, "r_y0": 300.4, "r_x1": 452.2, "r_y1": 300.4, "r_x2": 452.2, "r_y2": 292.3, "r_x3": 163.1, "r_y3": 292.3, "coord_origin": "TOPLEFT" }, "text": "demonstrated that table-structure can be recognized with impressive ac-", "orig": "demonstrated that table-structure can be recognized with impressive ac-", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 44, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 163.1, "r_y0": 311.3, "r_x1": 452.2, "r_y1": 311.3, "r_x2": 452.2, "r_y2": 303.2, "r_x3": 163.1, "r_y3": 303.2, "coord_origin": "TOPLEFT" }, "text": "curacy using Image-to-Markup-Sequence (Im2Seq) approaches. Taking", "orig": "curacy using Image-to-Markup-Sequence (Im2Seq) approaches. Taking", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 45, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 163.1, "r_y0": 322.3, "r_x1": 452.2, "r_y1": 322.3, "r_x2": 452.2, "r_y2": 314.2, "r_x3": 163.1, "r_y3": 314.2, "coord_origin": "TOPLEFT" }, "text": "only the image of a table, such models predict a sequence of tokens (e.g.", "orig": "only the image of a table, such models predict a sequence of tokens (e.g.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 46, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 163.1, "r_y0": 333.2, "r_x1": 452.2, "r_y1": 333.2, "r_x2": 452.2, "r_y2": 325.2, "r_x3": 163.1, "r_y3": 325.2, "coord_origin": "TOPLEFT" }, "text": "in HTML, LaTeX) which represent the structure of the table. Since the", "orig": "in HTML, LaTeX) which represent the structure of the table. Since the", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 47, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 163.1, "r_y0": 344.2, "r_x1": 452.2, "r_y1": 344.2, "r_x2": 452.2, "r_y2": 336.1, "r_x3": 163.1, "r_y3": 336.1, "coord_origin": "TOPLEFT" }, "text": "token representation of the table structure has a significant impact on", "orig": "token representation of the table structure has a significant impact on", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 48, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 163.1, "r_y0": 355.1, "r_x1": 452.2, "r_y1": 355.1, "r_x2": 452.2, "r_y2": 347.1, "r_x3": 163.1, "r_y3": 347.1, "coord_origin": "TOPLEFT" }, "text": "the accuracy and run-time performance of any Im2Seq model, we inves-", "orig": "the accuracy and run-time performance of any Im2Seq model, we inves-", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 49, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 163.1, "r_y0": 366.1, "r_x1": 452.2, "r_y1": 366.1, "r_x2": 452.2, "r_y2": 358.0, "r_x3": 163.1, "r_y3": 358.0, "coord_origin": "TOPLEFT" }, "text": "tigate in this paper how table-structure representation can be optimised.", "orig": "tigate in this paper how table-structure representation can be optimised.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 50, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 163.1, "r_y0": 377.1, "r_x1": 452.2, "r_y1": 377.1, "r_x2": 452.2, "r_y2": 369.0, "r_x3": 163.1, "r_y3": 369.0, "coord_origin": "TOPLEFT" }, "text": "We propose a new, optimised table-structure language (OTSL) with a", "orig": "We propose a new, optimised table-structure language (OTSL) with a", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 51, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 163.1, "r_y0": 388.0, "r_x1": 452.2, "r_y1": 388.0, "r_x2": 452.2, "r_y2": 380.0, "r_x3": 163.1, "r_y3": 380.0, "coord_origin": "TOPLEFT" }, "text": "minimized vocabulary and specific rules. The benefits of OTSL are that", "orig": "minimized vocabulary and specific rules. The benefits of OTSL are that", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 52, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 163.1, "r_y0": 399.0, "r_x1": 452.2, "r_y1": 399.0, "r_x2": 452.2, "r_y2": 390.9, "r_x3": 163.1, "r_y3": 390.9, "coord_origin": "TOPLEFT" }, "text": "it reduces the number of tokens to 5 (HTML needs 28+) and shortens", "orig": "it reduces the number of tokens to 5 (HTML needs 28+) and shortens", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 53, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 163.1, "r_y0": 409.9, "r_x1": 452.2, "r_y1": 409.9, "r_x2": 452.2, "r_y2": 401.9, "r_x3": 163.1, "r_y3": 401.9, "coord_origin": "TOPLEFT" }, "text": "the sequence length to half of HTML on average. Consequently, model", "orig": "the sequence length to half of HTML on average. Consequently, model", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 54, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 163.1, "r_y0": 420.9, "r_x1": 452.2, "r_y1": 420.9, "r_x2": 452.2, "r_y2": 412.8, "r_x3": 163.1, "r_y3": 412.8, "coord_origin": "TOPLEFT" }, "text": "accuracy improves significantly, inference time is halved compared to", "orig": "accuracy improves significantly, inference time is halved compared to", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 55, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 163.1, "r_y0": 431.9, "r_x1": 452.2, "r_y1": 431.9, "r_x2": 452.2, "r_y2": 423.8, "r_x3": 163.1, "r_y3": 423.8, "coord_origin": "TOPLEFT" }, "text": "HTML-based models, and the predicted table structures are always syn-", "orig": "HTML-based models, and the predicted table structures are always syn-", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 56, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 163.1, "r_y0": 442.8, "r_x1": 452.2, "r_y1": 442.8, "r_x2": 452.2, "r_y2": 434.7, "r_x3": 163.1, "r_y3": 434.7, "coord_origin": "TOPLEFT" }, "text": "tactically correct. This in turn eliminates most post-processing needs.", "orig": "tactically correct. This in turn eliminates most post-processing needs.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 57, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 163.1, "r_y0": 453.8, "r_x1": 452.2, "r_y1": 453.8, "r_x2": 452.2, "r_y2": 445.7, "r_x3": 163.1, "r_y3": 445.7, "coord_origin": "TOPLEFT" }, "text": "Popular table structure data-sets will be published in OTSL format to", "orig": "Popular table structure data-sets will be published in OTSL format to", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 58, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 163.1, "r_y0": 464.7, "r_x1": 225.6, "r_y1": 464.7, "r_x2": 225.6, "r_y2": 456.7, "r_x3": 163.1, "r_y3": 456.7, "coord_origin": "TOPLEFT" }, "text": "the community.", "orig": "the community.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, "text": "Abstract. Extracting tables from documents is a crucial task in any document conversion pipeline. Recently, transformer-based models have demonstrated that table-structure can be recognized with impressive accuracy using Image-to-Markup-Sequence (Im2Seq) approaches. Taking only the image of a table, such models predict a sequence of tokens (e.g. in HTML, LaTeX) which represent the structure of the table. Since the token representation of the table structure has a significant impact on the accuracy and run-time performance of any Im2Seq model, we investigate in this paper how table-structure representation can be optimised. We propose a new, optimised table-structure language (OTSL) with a minimized vocabulary and specific rules. The benefits of OTSL are that it reduces the number of tokens to 5 (HTML needs 28+) and shortens the sequence length to half of HTML on average. Consequently, model accuracy improves significantly, inference time is halved compared to HTML-based models, and the predicted table structures are always syntactically correct. This in turn eliminates most post-processing needs. Popular table structure data-sets will be published in OTSL format to the community." }, { "label": "text", "id": 4, "page_no": 0, "cluster": { "id": 4, "label": "text", "bbox": { "l": 163.1, "t": 478.7, "r": 452.2, "b": 497.8, "coord_origin": "TOPLEFT" }, "confidence": 0.93, "cells": [ { "index": 59, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 163.1, "r_y0": 486.6, "r_x1": 211.9, "r_y1": 486.6, "r_x2": 211.9, "r_y2": 478.7, "r_x3": 163.1, "r_y3": 478.7, "coord_origin": "TOPLEFT" }, "text": "Keywords:", "orig": "Keywords:", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 60, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 216.6, "r_y0": 486.8, "r_x1": 452.2, "r_y1": 486.8, "r_x2": 452.2, "r_y2": 478.8, "r_x3": 216.6, "r_y3": 478.8, "coord_origin": "TOPLEFT" }, "text": "Table Structure Recognition \u00b7 Data Representation \u00b7 Trans-", "orig": "Table Structure Recognition \u00b7 Data Representation \u00b7 Trans-", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 61, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 163.1, "r_y0": 497.8, "r_x1": 257.6, "r_y1": 497.8, "r_x2": 257.6, "r_y2": 489.7, "r_x3": 163.1, "r_y3": 489.7, "coord_origin": "TOPLEFT" }, "text": "formers \u00b7 Optimization.", "orig": "formers \u00b7 Optimization.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, "text": "Keywords: Table Structure Recognition \u00b7 Data Representation \u00b7 Transformers \u00b7 Optimization." }, { "label": "section_header", "id": 3, "page_no": 0, "cluster": { "id": 3, "label": "section_header", "bbox": { "l": 134.8, "t": 522.1, "r": 228.9, "b": 532.7, "coord_origin": "TOPLEFT" }, "confidence": 0.94, "cells": [ { "index": 62, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 134.8, "r_y0": 532.7, "r_x1": 141.5, "r_y1": 532.7, "r_x2": 141.5, "r_y2": 522.1, "r_x3": 134.8, "r_y3": 522.1, "coord_origin": "TOPLEFT" }, "text": "1", "orig": "1", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 63, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 154.9, "r_y0": 532.7, "r_x1": 228.9, "r_y1": 532.7, "r_x2": 228.9, "r_y2": 522.1, "r_x3": 154.9, "r_y3": 522.1, "coord_origin": "TOPLEFT" }, "text": "Introduction", "orig": "Introduction", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, "text": "1 Introduction" }, { "label": "text", "id": 0, "page_no": 0, "cluster": { "id": 0, "label": "text", "bbox": { "l": 134.8, "t": 548.3, "r": 480.6, "b": 628.8, "coord_origin": "TOPLEFT" }, "confidence": 0.98, "cells": [ { "index": 64, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 134.8, "r_y0": 557.1, "r_x1": 480.6, "r_y1": 557.1, "r_x2": 480.6, "r_y2": 548.3, "r_x3": 134.8, "r_y3": 548.3, "coord_origin": "TOPLEFT" }, "text": "Tables are ubiquitous in documents such as scientific papers, patents, reports,", "orig": "Tables are ubiquitous in documents such as scientific papers, patents, reports,", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 65, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 134.8, "r_y0": 569.0, "r_x1": 480.6, "r_y1": 569.0, "r_x2": 480.6, "r_y2": 560.2, "r_x3": 134.8, "r_y3": 560.2, "coord_origin": "TOPLEFT" }, "text": "manuals, specification sheets or marketing material. They often encode highly", "orig": "manuals, specification sheets or marketing material. They often encode highly", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 66, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 134.8, "r_y0": 581.0, "r_x1": 480.6, "r_y1": 581.0, "r_x2": 480.6, "r_y2": 572.2, "r_x3": 134.8, "r_y3": 572.2, "coord_origin": "TOPLEFT" }, "text": "valuable information and therefore need to be extracted with high accuracy.", "orig": "valuable information and therefore need to be extracted with high accuracy.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 67, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 134.8, "r_y0": 592.9, "r_x1": 480.6, "r_y1": 592.9, "r_x2": 480.6, "r_y2": 584.2, "r_x3": 134.8, "r_y3": 584.2, "coord_origin": "TOPLEFT" }, "text": "Unfortunately, tables appear in documents in various sizes, styling and struc-", "orig": "Unfortunately, tables appear in documents in various sizes, styling and struc-", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 68, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 134.8, "r_y0": 604.9, "r_x1": 480.6, "r_y1": 604.9, "r_x2": 480.6, "r_y2": 596.1, "r_x3": 134.8, "r_y3": 596.1, "coord_origin": "TOPLEFT" }, "text": "ture, making it difficult to recover their correct structure with simple analyt-", "orig": "ture, making it difficult to recover their correct structure with simple analyt-", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 69, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 134.8, "r_y0": 616.9, "r_x1": 480.6, "r_y1": 616.9, "r_x2": 480.6, "r_y2": 608.1, "r_x3": 134.8, "r_y3": 608.1, "coord_origin": "TOPLEFT" }, "text": "ical methods. Therefore, accurate table extraction is achieved these days with", "orig": "ical methods. Therefore, accurate table extraction is achieved these days with", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 70, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 134.8, "r_y0": 628.8, "r_x1": 279.3, "r_y1": 628.8, "r_x2": 279.3, "r_y2": 620.0, "r_x3": 134.8, "r_y3": 620.0, "coord_origin": "TOPLEFT" }, "text": "machine-learning based methods.", "orig": "machine-learning based methods.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, "text": "Tables are ubiquitous in documents such as scientific papers, patents, reports, manuals, specification sheets or marketing material. They often encode highly valuable information and therefore need to be extracted with high accuracy. Unfortunately, tables appear in documents in various sizes, styling and structure, making it difficult to recover their correct structure with simple analytical methods. Therefore, accurate table extraction is achieved these days with machine-learning based methods." }, { "label": "text", "id": 2, "page_no": 0, "cluster": { "id": 2, "label": "text", "bbox": { "l": 134.8, "t": 632.1, "r": 480.6, "b": 664.9, "coord_origin": "TOPLEFT" }, "confidence": 0.97, "cells": [ { "index": 71, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 149.7, "r_y0": 640.9, "r_x1": 480.6, "r_y1": 640.9, "r_x2": 480.6, "r_y2": 632.1, "r_x3": 149.7, "r_y3": 632.1, "coord_origin": "TOPLEFT" }, "text": "In modern document understanding systems [1,15], table extraction is typi-", "orig": "In modern document understanding systems [1,15], table extraction is typi-", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 72, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 134.8, "r_y0": 652.9, "r_x1": 480.6, "r_y1": 652.9, "r_x2": 480.6, "r_y2": 644.1, "r_x3": 134.8, "r_y3": 644.1, "coord_origin": "TOPLEFT" }, "text": "cally a two-step process. Firstly, every table on a page is located with a bounding", "orig": "cally a two-step process. Firstly, every table on a page is located with a bounding", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 73, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 134.8, "r_y0": 664.9, "r_x1": 480.6, "r_y1": 664.9, "r_x2": 480.6, "r_y2": 656.1, "r_x3": 134.8, "r_y3": 656.1, "coord_origin": "TOPLEFT" }, "text": "box, and secondly, their logical row and column structure is recognized. As of", "orig": "box, and secondly, their logical row and column structure is recognized. As of", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, "text": "In modern document understanding systems [1,15], table extraction is typically a two-step process. Firstly, every table on a page is located with a bounding box, and secondly, their logical row and column structure is recognized. As of" }, { "label": "page_header", "id": 6, "page_no": 0, "cluster": { "id": 6, "label": "page_header", "bbox": { "l": 18.3, "t": 209.5, "r": 36.3, "b": 555.0, "coord_origin": "TOPLEFT" }, "confidence": 0.89, "cells": [ { "index": 74, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 18.3, "r_y0": 555.0, "r_x1": 36.3, "r_y1": 555.0, "r_x2": 36.3, "r_y2": 209.5, "r_x3": 18.3, "r_y3": 209.5, "coord_origin": "TOPLEFT" }, "text": "arXiv:2305.03393v1 [cs.CV] 5 May 2023", "orig": "arXiv:2305.03393v1 [cs.CV] 5 May 2023", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, "text": "arXiv:2305.03393v1 [cs.CV] 5 May 2023" } ], "body": [ { "label": "section_header", "id": 5, "page_no": 0, "cluster": { "id": 5, "label": "section_header", "bbox": { "l": 134.8, "t": 115.9, "r": 480.6, "b": 146.5, "coord_origin": "TOPLEFT" }, "confidence": 0.89, "cells": [ { "index": 0, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 134.8, "r_y0": 128.6, "r_x1": 480.6, "r_y1": 128.6, "r_x2": 480.6, "r_y2": 115.9, "r_x3": 134.8, "r_y3": 115.9, "coord_origin": "TOPLEFT" }, "text": "Optimized Table Tokenization for Table Structure", "orig": "Optimized Table Tokenization for Table Structure", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 1, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 266.7, "r_y0": 146.5, "r_x1": 348.7, "r_y1": 146.5, "r_x2": 348.7, "r_y2": 133.8, "r_x3": 266.7, "r_y3": 133.8, "coord_origin": "TOPLEFT" }, "text": "Recognition", "orig": "Recognition", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, "text": "Optimized Table Tokenization for Table Structure Recognition" }, { "label": "key_value_region", "id": 16, "page_no": 0, "cluster": { "id": 16, "label": "key_value_region", "bbox": { "l": 139.3, "t": 169.7, "r": 476.0, "b": 236.3, "coord_origin": "TOPLEFT" }, "confidence": 0.48, "cells": [ { "index": 2, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 151.2, "r_y0": 180.5, "r_x1": 217.0, "r_y1": 180.5, "r_x2": 217.0, "r_y2": 171.7, "r_x3": 151.2, "r_y3": 171.7, "coord_origin": "TOPLEFT" }, "text": "Maksym Lysak", "orig": "Maksym Lysak", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 3, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 217.0, "r_y0": 176.3, "r_x1": 235.2, "r_y1": 176.3, "r_x2": 235.2, "r_y2": 170.1, "r_x3": 217.0, "r_y3": 170.1, "coord_origin": "TOPLEFT" }, "text": "[0000", "orig": "[0000", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 4, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 235.2, "r_y0": 176.3, "r_x1": 241.4, "r_y1": 176.3, "r_x2": 241.4, "r_y2": 169.7, "r_x3": 235.2, "r_y3": 169.7, "coord_origin": "TOPLEFT" }, "text": "\u2212", "orig": "\u2212", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 5, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 241.4, "r_y0": 176.3, "r_x1": 257.3, "r_y1": 176.3, "r_x2": 257.3, "r_y2": 170.1, "r_x3": 241.4, "r_y3": 170.1, "coord_origin": "TOPLEFT" }, "text": "0002", "orig": "0002", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 6, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 257.3, "r_y0": 176.3, "r_x1": 263.5, "r_y1": 176.3, "r_x2": 263.5, "r_y2": 169.7, "r_x3": 257.3, "r_y3": 169.7, "coord_origin": "TOPLEFT" }, "text": "\u2212", "orig": "\u2212", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 7, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 263.5, "r_y0": 176.3, "r_x1": 279.4, "r_y1": 176.3, "r_x2": 279.4, "r_y2": 170.1, "r_x3": 263.5, "r_y3": 170.1, "coord_origin": "TOPLEFT" }, "text": "3723", "orig": "3723", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 8, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 279.4, "r_y0": 176.3, "r_x1": 285.6, "r_y1": 176.3, "r_x2": 285.6, "r_y2": 169.7, "r_x3": 279.4, "r_y3": 169.7, "coord_origin": "TOPLEFT" }, "text": "\u2212", "orig": "\u2212", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 9, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 285.6, "r_y0": 180.5, "r_x1": 392.3, "r_y1": 180.5, "r_x2": 392.3, "r_y2": 171.7, "r_x3": 285.6, "r_y3": 171.7, "coord_origin": "TOPLEFT" }, "text": "$^{6960]}$, Ahmed Nassar[0000", "orig": "$^{6960]}$, Ahmed Nassar[0000", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 10, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 392.3, "r_y0": 176.3, "r_x1": 398.5, "r_y1": 176.3, "r_x2": 398.5, "r_y2": 169.7, "r_x3": 392.3, "r_y3": 169.7, "coord_origin": "TOPLEFT" }, "text": "\u2212", "orig": "\u2212", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 11, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 398.5, "r_y0": 176.3, "r_x1": 414.4, "r_y1": 176.3, "r_x2": 414.4, "r_y2": 170.1, "r_x3": 398.5, "r_y3": 170.1, "coord_origin": "TOPLEFT" }, "text": "0002", "orig": "0002", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 12, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 414.4, "r_y0": 176.3, "r_x1": 420.6, "r_y1": 176.3, "r_x2": 420.6, "r_y2": 169.7, "r_x3": 414.4, "r_y3": 169.7, "coord_origin": "TOPLEFT" }, "text": "\u2212", "orig": "\u2212", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 13, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 420.6, "r_y0": 176.3, "r_x1": 436.5, "r_y1": 176.3, "r_x2": 436.5, "r_y2": 170.1, "r_x3": 420.6, "r_y3": 170.1, "coord_origin": "TOPLEFT" }, "text": "9468", "orig": "9468", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 14, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 436.5, "r_y0": 176.3, "r_x1": 442.7, "r_y1": 176.3, "r_x2": 442.7, "r_y2": 169.7, "r_x3": 436.5, "r_y3": 169.7, "coord_origin": "TOPLEFT" }, "text": "\u2212", "orig": "\u2212", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 15, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 442.7, "r_y0": 180.5, "r_x1": 464.1, "r_y1": 180.5, "r_x2": 464.1, "r_y2": 171.7, "r_x3": 442.7, "r_y3": 171.7, "coord_origin": "TOPLEFT" }, "text": "$^{0822]}$,", "orig": "$^{0822]}$,", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 16, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 139.3, "r_y0": 192.4, "r_x1": 224.8, "r_y1": 192.4, "r_x2": 224.8, "r_y2": 183.6, "r_x3": 139.3, "r_y3": 183.6, "coord_origin": "TOPLEFT" }, "text": "Nikolaos Livathinos", "orig": "Nikolaos Livathinos", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 17, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 224.8, "r_y0": 188.2, "r_x1": 242.9, "r_y1": 188.2, "r_x2": 242.9, "r_y2": 182.0, "r_x3": 224.8, "r_y3": 182.0, "coord_origin": "TOPLEFT" }, "text": "[0000", "orig": "[0000", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 18, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 242.9, "r_y0": 188.2, "r_x1": 249.2, "r_y1": 188.2, "r_x2": 249.2, "r_y2": 181.6, "r_x3": 242.9, "r_y3": 181.6, "coord_origin": "TOPLEFT" }, "text": "\u2212", "orig": "\u2212", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 19, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 249.2, "r_y0": 188.2, "r_x1": 265.1, "r_y1": 188.2, "r_x2": 265.1, "r_y2": 182.0, "r_x3": 249.2, "r_y3": 182.0, "coord_origin": "TOPLEFT" }, "text": "0001", "orig": "0001", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 20, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 265.1, "r_y0": 188.2, "r_x1": 271.3, "r_y1": 188.2, "r_x2": 271.3, "r_y2": 181.6, "r_x3": 265.1, "r_y3": 181.6, "coord_origin": "TOPLEFT" }, "text": "\u2212", "orig": "\u2212", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 21, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 271.3, "r_y0": 188.2, "r_x1": 287.2, "r_y1": 188.2, "r_x2": 287.2, "r_y2": 182.0, "r_x3": 271.3, "r_y3": 182.0, "coord_origin": "TOPLEFT" }, "text": "8513", "orig": "8513", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 22, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 287.2, "r_y0": 188.2, "r_x1": 293.4, "r_y1": 188.2, "r_x2": 293.4, "r_y2": 181.6, "r_x3": 287.2, "r_y3": 181.6, "coord_origin": "TOPLEFT" }, "text": "\u2212", "orig": "\u2212", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 23, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 293.4, "r_y0": 192.4, "r_x1": 404.2, "r_y1": 192.4, "r_x2": 404.2, "r_y2": 183.6, "r_x3": 293.4, "r_y3": 183.6, "coord_origin": "TOPLEFT" }, "text": "$^{3491]}$, Christoph Auer[0000", "orig": "$^{3491]}$, Christoph Auer[0000", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 24, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 404.2, "r_y0": 188.2, "r_x1": 410.4, "r_y1": 188.2, "r_x2": 410.4, "r_y2": 181.6, "r_x3": 404.2, "r_y3": 181.6, "coord_origin": "TOPLEFT" }, "text": "\u2212", "orig": "\u2212", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 25, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 410.4, "r_y0": 188.2, "r_x1": 426.3, "r_y1": 188.2, "r_x2": 426.3, "r_y2": 182.0, "r_x3": 410.4, "r_y3": 182.0, "coord_origin": "TOPLEFT" }, "text": "0001", "orig": "0001", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 26, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 426.3, "r_y0": 188.2, "r_x1": 432.5, "r_y1": 188.2, "r_x2": 432.5, "r_y2": 181.6, "r_x3": 426.3, "r_y3": 181.6, "coord_origin": "TOPLEFT" }, "text": "\u2212", "orig": "\u2212", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 27, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 432.5, "r_y0": 188.2, "r_x1": 448.4, "r_y1": 188.2, "r_x2": 448.4, "r_y2": 182.0, "r_x3": 432.5, "r_y3": 182.0, "coord_origin": "TOPLEFT" }, "text": "5761", "orig": "5761", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 28, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 448.4, "r_y0": 188.2, "r_x1": 454.6, "r_y1": 188.2, "r_x2": 454.6, "r_y2": 181.6, "r_x3": 448.4, "r_y3": 181.6, "coord_origin": "TOPLEFT" }, "text": "\u2212", "orig": "\u2212", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 29, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 454.6, "r_y0": 192.4, "r_x1": 476.0, "r_y1": 192.4, "r_x2": 476.0, "r_y2": 183.6, "r_x3": 454.6, "r_y3": 183.6, "coord_origin": "TOPLEFT" }, "text": "$^{0422]}$,", "orig": "$^{0422]}$,", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 30, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 229.5, "r_y0": 204.4, "r_x1": 298.6, "r_y1": 204.4, "r_x2": 298.6, "r_y2": 195.6, "r_x3": 229.5, "r_y3": 195.6, "coord_origin": "TOPLEFT" }, "text": "and Peter Staar", "orig": "and Peter Staar", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 31, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 298.6, "r_y0": 200.2, "r_x1": 316.7, "r_y1": 200.2, "r_x2": 316.7, "r_y2": 194.0, "r_x3": 298.6, "r_y3": 194.0, "coord_origin": "TOPLEFT" }, "text": "[0000", "orig": "[0000", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 32, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 316.7, "r_y0": 200.2, "r_x1": 323.0, "r_y1": 200.2, "r_x2": 323.0, "r_y2": 193.6, "r_x3": 316.7, "r_y3": 193.6, "coord_origin": "TOPLEFT" }, "text": "\u2212", "orig": "\u2212", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 33, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 323.0, "r_y0": 200.2, "r_x1": 338.9, "r_y1": 200.2, "r_x2": 338.9, "r_y2": 194.0, "r_x3": 323.0, "r_y3": 194.0, "coord_origin": "TOPLEFT" }, "text": "0002", "orig": "0002", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 34, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 338.9, "r_y0": 200.2, "r_x1": 345.1, "r_y1": 200.2, "r_x2": 345.1, "r_y2": 193.6, "r_x3": 338.9, "r_y3": 193.6, "coord_origin": "TOPLEFT" }, "text": "\u2212", "orig": "\u2212", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 35, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 345.1, "r_y0": 200.2, "r_x1": 361.0, "r_y1": 200.2, "r_x2": 361.0, "r_y2": 194.0, "r_x3": 345.1, "r_y3": 194.0, "coord_origin": "TOPLEFT" }, "text": "8088", "orig": "8088", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 36, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 361.0, "r_y0": 200.2, "r_x1": 367.2, "r_y1": 200.2, "r_x2": 367.2, "r_y2": 193.6, "r_x3": 361.0, "r_y3": 193.6, "coord_origin": "TOPLEFT" }, "text": "\u2212", "orig": "\u2212", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 37, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 367.2, "r_y0": 200.2, "r_x1": 385.3, "r_y1": 200.2, "r_x2": 385.3, "r_y2": 194.0, "r_x3": 367.2, "r_y3": 194.0, "coord_origin": "TOPLEFT" }, "text": "0823]", "orig": "0823]", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 38, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 279.1, "r_y0": 225.3, "r_x1": 336.3, "r_y1": 225.3, "r_x2": 336.3, "r_y2": 217.2, "r_x3": 279.1, "r_y3": 217.2, "coord_origin": "TOPLEFT" }, "text": "IBM Research", "orig": "IBM Research", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 39, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 223.0, "r_y0": 236.3, "r_x1": 392.4, "r_y1": 236.3, "r_x2": 392.4, "r_y2": 228.8, "r_x3": 223.0, "r_y3": 228.8, "coord_origin": "TOPLEFT" }, "text": "{mly,ahn,nli,cau,taa}@zurich.ibm.com", "orig": "{mly,ahn,nli,cau,taa}@zurich.ibm.com", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [ { "id": 7, "label": "text", "bbox": { "l": 139.3, "t": 169.7, "r": 476.0, "b": 200.2, "coord_origin": "TOPLEFT" }, "confidence": 0.79, "cells": [ { "index": 2, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 151.2, "r_y0": 180.5, "r_x1": 217.0, "r_y1": 180.5, "r_x2": 217.0, "r_y2": 171.7, "r_x3": 151.2, "r_y3": 171.7, "coord_origin": "TOPLEFT" }, "text": "Maksym Lysak", "orig": "Maksym Lysak", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 3, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 217.0, "r_y0": 176.3, "r_x1": 235.2, "r_y1": 176.3, "r_x2": 235.2, "r_y2": 170.1, "r_x3": 217.0, "r_y3": 170.1, "coord_origin": "TOPLEFT" }, "text": "[0000", "orig": "[0000", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 4, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 235.2, "r_y0": 176.3, "r_x1": 241.4, "r_y1": 176.3, "r_x2": 241.4, "r_y2": 169.7, "r_x3": 235.2, "r_y3": 169.7, "coord_origin": "TOPLEFT" }, "text": "\u2212", "orig": "\u2212", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 5, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 241.4, "r_y0": 176.3, "r_x1": 257.3, "r_y1": 176.3, "r_x2": 257.3, "r_y2": 170.1, "r_x3": 241.4, "r_y3": 170.1, "coord_origin": "TOPLEFT" }, "text": "0002", "orig": "0002", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 6, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 257.3, "r_y0": 176.3, "r_x1": 263.5, "r_y1": 176.3, "r_x2": 263.5, "r_y2": 169.7, "r_x3": 257.3, "r_y3": 169.7, "coord_origin": "TOPLEFT" }, "text": "\u2212", "orig": "\u2212", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 7, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 263.5, "r_y0": 176.3, "r_x1": 279.4, "r_y1": 176.3, "r_x2": 279.4, "r_y2": 170.1, "r_x3": 263.5, "r_y3": 170.1, "coord_origin": "TOPLEFT" }, "text": "3723", "orig": "3723", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 8, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 279.4, "r_y0": 176.3, "r_x1": 285.6, "r_y1": 176.3, "r_x2": 285.6, "r_y2": 169.7, "r_x3": 279.4, "r_y3": 169.7, "coord_origin": "TOPLEFT" }, "text": "\u2212", "orig": "\u2212", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 9, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 285.6, "r_y0": 180.5, "r_x1": 392.3, "r_y1": 180.5, "r_x2": 392.3, "r_y2": 171.7, "r_x3": 285.6, "r_y3": 171.7, "coord_origin": "TOPLEFT" }, "text": "$^{6960]}$, Ahmed Nassar[0000", "orig": "$^{6960]}$, Ahmed Nassar[0000", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 10, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 392.3, "r_y0": 176.3, "r_x1": 398.5, "r_y1": 176.3, "r_x2": 398.5, "r_y2": 169.7, "r_x3": 392.3, "r_y3": 169.7, "coord_origin": "TOPLEFT" }, "text": "\u2212", "orig": "\u2212", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 11, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 398.5, "r_y0": 176.3, "r_x1": 414.4, "r_y1": 176.3, "r_x2": 414.4, "r_y2": 170.1, "r_x3": 398.5, "r_y3": 170.1, "coord_origin": "TOPLEFT" }, "text": "0002", "orig": "0002", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 12, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 414.4, "r_y0": 176.3, "r_x1": 420.6, "r_y1": 176.3, "r_x2": 420.6, "r_y2": 169.7, "r_x3": 414.4, "r_y3": 169.7, "coord_origin": "TOPLEFT" }, "text": "\u2212", "orig": "\u2212", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 13, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 420.6, "r_y0": 176.3, "r_x1": 436.5, "r_y1": 176.3, "r_x2": 436.5, "r_y2": 170.1, "r_x3": 420.6, "r_y3": 170.1, "coord_origin": "TOPLEFT" }, "text": "9468", "orig": "9468", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 14, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 436.5, "r_y0": 176.3, "r_x1": 442.7, "r_y1": 176.3, "r_x2": 442.7, "r_y2": 169.7, "r_x3": 436.5, "r_y3": 169.7, "coord_origin": "TOPLEFT" }, "text": "\u2212", "orig": "\u2212", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 15, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 442.7, "r_y0": 180.5, "r_x1": 464.1, "r_y1": 180.5, "r_x2": 464.1, "r_y2": 171.7, "r_x3": 442.7, "r_y3": 171.7, "coord_origin": "TOPLEFT" }, "text": "$^{0822]}$,", "orig": "$^{0822]}$,", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 16, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 139.3, "r_y0": 192.4, "r_x1": 224.8, "r_y1": 192.4, "r_x2": 224.8, "r_y2": 183.6, "r_x3": 139.3, "r_y3": 183.6, "coord_origin": "TOPLEFT" }, "text": "Nikolaos Livathinos", "orig": "Nikolaos Livathinos", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 17, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 224.8, "r_y0": 188.2, "r_x1": 242.9, "r_y1": 188.2, "r_x2": 242.9, "r_y2": 182.0, "r_x3": 224.8, "r_y3": 182.0, "coord_origin": "TOPLEFT" }, "text": "[0000", "orig": "[0000", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 18, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 242.9, "r_y0": 188.2, "r_x1": 249.2, "r_y1": 188.2, "r_x2": 249.2, "r_y2": 181.6, "r_x3": 242.9, "r_y3": 181.6, "coord_origin": "TOPLEFT" }, "text": "\u2212", "orig": "\u2212", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 19, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 249.2, "r_y0": 188.2, "r_x1": 265.1, "r_y1": 188.2, "r_x2": 265.1, "r_y2": 182.0, "r_x3": 249.2, "r_y3": 182.0, "coord_origin": "TOPLEFT" }, "text": "0001", "orig": "0001", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 20, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 265.1, "r_y0": 188.2, "r_x1": 271.3, "r_y1": 188.2, "r_x2": 271.3, "r_y2": 181.6, "r_x3": 265.1, "r_y3": 181.6, "coord_origin": "TOPLEFT" }, "text": "\u2212", "orig": "\u2212", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 21, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 271.3, "r_y0": 188.2, "r_x1": 287.2, "r_y1": 188.2, "r_x2": 287.2, "r_y2": 182.0, "r_x3": 271.3, "r_y3": 182.0, "coord_origin": "TOPLEFT" }, "text": "8513", "orig": "8513", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 22, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 287.2, "r_y0": 188.2, "r_x1": 293.4, "r_y1": 188.2, "r_x2": 293.4, "r_y2": 181.6, "r_x3": 287.2, "r_y3": 181.6, "coord_origin": "TOPLEFT" }, "text": "\u2212", "orig": "\u2212", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 23, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 293.4, "r_y0": 192.4, "r_x1": 404.2, "r_y1": 192.4, "r_x2": 404.2, "r_y2": 183.6, "r_x3": 293.4, "r_y3": 183.6, "coord_origin": "TOPLEFT" }, "text": "$^{3491]}$, Christoph Auer[0000", "orig": "$^{3491]}$, Christoph Auer[0000", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 24, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 404.2, "r_y0": 188.2, "r_x1": 410.4, "r_y1": 188.2, "r_x2": 410.4, "r_y2": 181.6, "r_x3": 404.2, "r_y3": 181.6, "coord_origin": "TOPLEFT" }, "text": "\u2212", "orig": "\u2212", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 25, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 410.4, "r_y0": 188.2, "r_x1": 426.3, "r_y1": 188.2, "r_x2": 426.3, "r_y2": 182.0, "r_x3": 410.4, "r_y3": 182.0, "coord_origin": "TOPLEFT" }, "text": "0001", "orig": "0001", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 26, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 426.3, "r_y0": 188.2, "r_x1": 432.5, "r_y1": 188.2, "r_x2": 432.5, "r_y2": 181.6, "r_x3": 426.3, "r_y3": 181.6, "coord_origin": "TOPLEFT" }, "text": "\u2212", "orig": "\u2212", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 27, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 432.5, "r_y0": 188.2, "r_x1": 448.4, "r_y1": 188.2, "r_x2": 448.4, "r_y2": 182.0, "r_x3": 432.5, "r_y3": 182.0, "coord_origin": "TOPLEFT" }, "text": "5761", "orig": "5761", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 28, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 448.4, "r_y0": 188.2, "r_x1": 454.6, "r_y1": 188.2, "r_x2": 454.6, "r_y2": 181.6, "r_x3": 448.4, "r_y3": 181.6, "coord_origin": "TOPLEFT" }, "text": "\u2212", "orig": "\u2212", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 29, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 454.6, "r_y0": 192.4, "r_x1": 476.0, "r_y1": 192.4, "r_x2": 476.0, "r_y2": 183.6, "r_x3": 454.6, "r_y3": 183.6, "coord_origin": "TOPLEFT" }, "text": "$^{0422]}$,", "orig": "$^{0422]}$,", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 31, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 298.6, "r_y0": 200.2, "r_x1": 316.7, "r_y1": 200.2, "r_x2": 316.7, "r_y2": 194.0, "r_x3": 298.6, "r_y3": 194.0, "coord_origin": "TOPLEFT" }, "text": "[0000", "orig": "[0000", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 32, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 316.7, "r_y0": 200.2, "r_x1": 323.0, "r_y1": 200.2, "r_x2": 323.0, "r_y2": 193.6, "r_x3": 316.7, "r_y3": 193.6, "coord_origin": "TOPLEFT" }, "text": "\u2212", "orig": "\u2212", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 33, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 323.0, "r_y0": 200.2, "r_x1": 338.9, "r_y1": 200.2, "r_x2": 338.9, "r_y2": 194.0, "r_x3": 323.0, "r_y3": 194.0, "coord_origin": "TOPLEFT" }, "text": "0002", "orig": "0002", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 34, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 338.9, "r_y0": 200.2, "r_x1": 345.1, "r_y1": 200.2, "r_x2": 345.1, "r_y2": 193.6, "r_x3": 338.9, "r_y3": 193.6, "coord_origin": "TOPLEFT" }, "text": "\u2212", "orig": "\u2212", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 35, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 345.1, "r_y0": 200.2, "r_x1": 361.0, "r_y1": 200.2, "r_x2": 361.0, "r_y2": 194.0, "r_x3": 345.1, "r_y3": 194.0, "coord_origin": "TOPLEFT" }, "text": "8088", "orig": "8088", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 36, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 361.0, "r_y0": 200.2, "r_x1": 367.2, "r_y1": 200.2, "r_x2": 367.2, "r_y2": 193.6, "r_x3": 361.0, "r_y3": 193.6, "coord_origin": "TOPLEFT" }, "text": "\u2212", "orig": "\u2212", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 37, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 367.2, "r_y0": 200.2, "r_x1": 385.3, "r_y1": 200.2, "r_x2": 385.3, "r_y2": 194.0, "r_x3": 367.2, "r_y3": 194.0, "coord_origin": "TOPLEFT" }, "text": "0823]", "orig": "0823]", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 13, "label": "text", "bbox": { "l": 229.5, "t": 195.6, "r": 298.6, "b": 204.4, "coord_origin": "TOPLEFT" }, "confidence": 0.5, "cells": [ { "index": 30, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 229.5, "r_y0": 204.4, "r_x1": 298.6, "r_y1": 204.4, "r_x2": 298.6, "r_y2": 195.6, "r_x3": 229.5, "r_y3": 195.6, "coord_origin": "TOPLEFT" }, "text": "and Peter Staar", "orig": "and Peter Staar", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 9, "label": "text", "bbox": { "l": 279.1, "t": 217.2, "r": 336.3, "b": 225.3, "coord_origin": "TOPLEFT" }, "confidence": 0.63, "cells": [ { "index": 38, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 279.1, "r_y0": 225.3, "r_x1": 336.3, "r_y1": 225.3, "r_x2": 336.3, "r_y2": 217.2, "r_x3": 279.1, "r_y3": 217.2, "coord_origin": "TOPLEFT" }, "text": "IBM Research", "orig": "IBM Research", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 8, "label": "text", "bbox": { "l": 223.0, "t": 228.8, "r": 392.4, "b": 236.3, "coord_origin": "TOPLEFT" }, "confidence": 0.69, "cells": [ { "index": 39, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 223.0, "r_y0": 236.3, "r_x1": 392.4, "r_y1": 236.3, "r_x2": 392.4, "r_y2": 228.8, "r_x3": 223.0, "r_y3": 228.8, "coord_origin": "TOPLEFT" }, "text": "{mly,ahn,nli,cau,taa}@zurich.ibm.com", "orig": "{mly,ahn,nli,cau,taa}@zurich.ibm.com", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] } ] }, "text": null }, { "label": "text", "id": 1, "page_no": 0, "cluster": { "id": 1, "label": "text", "bbox": { "l": 163.1, "t": 270.3, "r": 452.2, "b": 464.7, "coord_origin": "TOPLEFT" }, "confidence": 0.98, "cells": [ { "index": 40, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 163.1, "r_y0": 278.2, "r_x1": 206.6, "r_y1": 278.2, "r_x2": 206.6, "r_y2": 270.3, "r_x3": 163.1, "r_y3": 270.3, "coord_origin": "TOPLEFT" }, "text": "Abstract.", "orig": "Abstract.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 41, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 211.6, "r_y0": 278.4, "r_x1": 452.2, "r_y1": 278.4, "r_x2": 452.2, "r_y2": 270.4, "r_x3": 211.6, "r_y3": 270.4, "coord_origin": "TOPLEFT" }, "text": "Extracting tables from documents is a crucial task in any", "orig": "Extracting tables from documents is a crucial task in any", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 42, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 163.1, "r_y0": 289.4, "r_x1": 452.2, "r_y1": 289.4, "r_x2": 452.2, "r_y2": 281.3, "r_x3": 163.1, "r_y3": 281.3, "coord_origin": "TOPLEFT" }, "text": "document conversion pipeline. Recently, transformer-based models have", "orig": "document conversion pipeline. Recently, transformer-based models have", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 43, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 163.1, "r_y0": 300.4, "r_x1": 452.2, "r_y1": 300.4, "r_x2": 452.2, "r_y2": 292.3, "r_x3": 163.1, "r_y3": 292.3, "coord_origin": "TOPLEFT" }, "text": "demonstrated that table-structure can be recognized with impressive ac-", "orig": "demonstrated that table-structure can be recognized with impressive ac-", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 44, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 163.1, "r_y0": 311.3, "r_x1": 452.2, "r_y1": 311.3, "r_x2": 452.2, "r_y2": 303.2, "r_x3": 163.1, "r_y3": 303.2, "coord_origin": "TOPLEFT" }, "text": "curacy using Image-to-Markup-Sequence (Im2Seq) approaches. Taking", "orig": "curacy using Image-to-Markup-Sequence (Im2Seq) approaches. Taking", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 45, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 163.1, "r_y0": 322.3, "r_x1": 452.2, "r_y1": 322.3, "r_x2": 452.2, "r_y2": 314.2, "r_x3": 163.1, "r_y3": 314.2, "coord_origin": "TOPLEFT" }, "text": "only the image of a table, such models predict a sequence of tokens (e.g.", "orig": "only the image of a table, such models predict a sequence of tokens (e.g.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 46, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 163.1, "r_y0": 333.2, "r_x1": 452.2, "r_y1": 333.2, "r_x2": 452.2, "r_y2": 325.2, "r_x3": 163.1, "r_y3": 325.2, "coord_origin": "TOPLEFT" }, "text": "in HTML, LaTeX) which represent the structure of the table. Since the", "orig": "in HTML, LaTeX) which represent the structure of the table. Since the", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 47, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 163.1, "r_y0": 344.2, "r_x1": 452.2, "r_y1": 344.2, "r_x2": 452.2, "r_y2": 336.1, "r_x3": 163.1, "r_y3": 336.1, "coord_origin": "TOPLEFT" }, "text": "token representation of the table structure has a significant impact on", "orig": "token representation of the table structure has a significant impact on", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 48, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 163.1, "r_y0": 355.1, "r_x1": 452.2, "r_y1": 355.1, "r_x2": 452.2, "r_y2": 347.1, "r_x3": 163.1, "r_y3": 347.1, "coord_origin": "TOPLEFT" }, "text": "the accuracy and run-time performance of any Im2Seq model, we inves-", "orig": "the accuracy and run-time performance of any Im2Seq model, we inves-", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 49, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 163.1, "r_y0": 366.1, "r_x1": 452.2, "r_y1": 366.1, "r_x2": 452.2, "r_y2": 358.0, "r_x3": 163.1, "r_y3": 358.0, "coord_origin": "TOPLEFT" }, "text": "tigate in this paper how table-structure representation can be optimised.", "orig": "tigate in this paper how table-structure representation can be optimised.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 50, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 163.1, "r_y0": 377.1, "r_x1": 452.2, "r_y1": 377.1, "r_x2": 452.2, "r_y2": 369.0, "r_x3": 163.1, "r_y3": 369.0, "coord_origin": "TOPLEFT" }, "text": "We propose a new, optimised table-structure language (OTSL) with a", "orig": "We propose a new, optimised table-structure language (OTSL) with a", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 51, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 163.1, "r_y0": 388.0, "r_x1": 452.2, "r_y1": 388.0, "r_x2": 452.2, "r_y2": 380.0, "r_x3": 163.1, "r_y3": 380.0, "coord_origin": "TOPLEFT" }, "text": "minimized vocabulary and specific rules. The benefits of OTSL are that", "orig": "minimized vocabulary and specific rules. The benefits of OTSL are that", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 52, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 163.1, "r_y0": 399.0, "r_x1": 452.2, "r_y1": 399.0, "r_x2": 452.2, "r_y2": 390.9, "r_x3": 163.1, "r_y3": 390.9, "coord_origin": "TOPLEFT" }, "text": "it reduces the number of tokens to 5 (HTML needs 28+) and shortens", "orig": "it reduces the number of tokens to 5 (HTML needs 28+) and shortens", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 53, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 163.1, "r_y0": 409.9, "r_x1": 452.2, "r_y1": 409.9, "r_x2": 452.2, "r_y2": 401.9, "r_x3": 163.1, "r_y3": 401.9, "coord_origin": "TOPLEFT" }, "text": "the sequence length to half of HTML on average. Consequently, model", "orig": "the sequence length to half of HTML on average. Consequently, model", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 54, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 163.1, "r_y0": 420.9, "r_x1": 452.2, "r_y1": 420.9, "r_x2": 452.2, "r_y2": 412.8, "r_x3": 163.1, "r_y3": 412.8, "coord_origin": "TOPLEFT" }, "text": "accuracy improves significantly, inference time is halved compared to", "orig": "accuracy improves significantly, inference time is halved compared to", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 55, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 163.1, "r_y0": 431.9, "r_x1": 452.2, "r_y1": 431.9, "r_x2": 452.2, "r_y2": 423.8, "r_x3": 163.1, "r_y3": 423.8, "coord_origin": "TOPLEFT" }, "text": "HTML-based models, and the predicted table structures are always syn-", "orig": "HTML-based models, and the predicted table structures are always syn-", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 56, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 163.1, "r_y0": 442.8, "r_x1": 452.2, "r_y1": 442.8, "r_x2": 452.2, "r_y2": 434.7, "r_x3": 163.1, "r_y3": 434.7, "coord_origin": "TOPLEFT" }, "text": "tactically correct. This in turn eliminates most post-processing needs.", "orig": "tactically correct. This in turn eliminates most post-processing needs.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 57, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 163.1, "r_y0": 453.8, "r_x1": 452.2, "r_y1": 453.8, "r_x2": 452.2, "r_y2": 445.7, "r_x3": 163.1, "r_y3": 445.7, "coord_origin": "TOPLEFT" }, "text": "Popular table structure data-sets will be published in OTSL format to", "orig": "Popular table structure data-sets will be published in OTSL format to", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 58, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 163.1, "r_y0": 464.7, "r_x1": 225.6, "r_y1": 464.7, "r_x2": 225.6, "r_y2": 456.7, "r_x3": 163.1, "r_y3": 456.7, "coord_origin": "TOPLEFT" }, "text": "the community.", "orig": "the community.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, "text": "Abstract. Extracting tables from documents is a crucial task in any document conversion pipeline. Recently, transformer-based models have demonstrated that table-structure can be recognized with impressive accuracy using Image-to-Markup-Sequence (Im2Seq) approaches. Taking only the image of a table, such models predict a sequence of tokens (e.g. in HTML, LaTeX) which represent the structure of the table. Since the token representation of the table structure has a significant impact on the accuracy and run-time performance of any Im2Seq model, we investigate in this paper how table-structure representation can be optimised. We propose a new, optimised table-structure language (OTSL) with a minimized vocabulary and specific rules. The benefits of OTSL are that it reduces the number of tokens to 5 (HTML needs 28+) and shortens the sequence length to half of HTML on average. Consequently, model accuracy improves significantly, inference time is halved compared to HTML-based models, and the predicted table structures are always syntactically correct. This in turn eliminates most post-processing needs. Popular table structure data-sets will be published in OTSL format to the community." }, { "label": "text", "id": 4, "page_no": 0, "cluster": { "id": 4, "label": "text", "bbox": { "l": 163.1, "t": 478.7, "r": 452.2, "b": 497.8, "coord_origin": "TOPLEFT" }, "confidence": 0.93, "cells": [ { "index": 59, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 163.1, "r_y0": 486.6, "r_x1": 211.9, "r_y1": 486.6, "r_x2": 211.9, "r_y2": 478.7, "r_x3": 163.1, "r_y3": 478.7, "coord_origin": "TOPLEFT" }, "text": "Keywords:", "orig": "Keywords:", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 60, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 216.6, "r_y0": 486.8, "r_x1": 452.2, "r_y1": 486.8, "r_x2": 452.2, "r_y2": 478.8, "r_x3": 216.6, "r_y3": 478.8, "coord_origin": "TOPLEFT" }, "text": "Table Structure Recognition \u00b7 Data Representation \u00b7 Trans-", "orig": "Table Structure Recognition \u00b7 Data Representation \u00b7 Trans-", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 61, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 163.1, "r_y0": 497.8, "r_x1": 257.6, "r_y1": 497.8, "r_x2": 257.6, "r_y2": 489.7, "r_x3": 163.1, "r_y3": 489.7, "coord_origin": "TOPLEFT" }, "text": "formers \u00b7 Optimization.", "orig": "formers \u00b7 Optimization.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, "text": "Keywords: Table Structure Recognition \u00b7 Data Representation \u00b7 Transformers \u00b7 Optimization." }, { "label": "section_header", "id": 3, "page_no": 0, "cluster": { "id": 3, "label": "section_header", "bbox": { "l": 134.8, "t": 522.1, "r": 228.9, "b": 532.7, "coord_origin": "TOPLEFT" }, "confidence": 0.94, "cells": [ { "index": 62, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 134.8, "r_y0": 532.7, "r_x1": 141.5, "r_y1": 532.7, "r_x2": 141.5, "r_y2": 522.1, "r_x3": 134.8, "r_y3": 522.1, "coord_origin": "TOPLEFT" }, "text": "1", "orig": "1", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 63, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 154.9, "r_y0": 532.7, "r_x1": 228.9, "r_y1": 532.7, "r_x2": 228.9, "r_y2": 522.1, "r_x3": 154.9, "r_y3": 522.1, "coord_origin": "TOPLEFT" }, "text": "Introduction", "orig": "Introduction", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, "text": "1 Introduction" }, { "label": "text", "id": 0, "page_no": 0, "cluster": { "id": 0, "label": "text", "bbox": { "l": 134.8, "t": 548.3, "r": 480.6, "b": 628.8, "coord_origin": "TOPLEFT" }, "confidence": 0.98, "cells": [ { "index": 64, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 134.8, "r_y0": 557.1, "r_x1": 480.6, "r_y1": 557.1, "r_x2": 480.6, "r_y2": 548.3, "r_x3": 134.8, "r_y3": 548.3, "coord_origin": "TOPLEFT" }, "text": "Tables are ubiquitous in documents such as scientific papers, patents, reports,", "orig": "Tables are ubiquitous in documents such as scientific papers, patents, reports,", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 65, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 134.8, "r_y0": 569.0, "r_x1": 480.6, "r_y1": 569.0, "r_x2": 480.6, "r_y2": 560.2, "r_x3": 134.8, "r_y3": 560.2, "coord_origin": "TOPLEFT" }, "text": "manuals, specification sheets or marketing material. They often encode highly", "orig": "manuals, specification sheets or marketing material. They often encode highly", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 66, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 134.8, "r_y0": 581.0, "r_x1": 480.6, "r_y1": 581.0, "r_x2": 480.6, "r_y2": 572.2, "r_x3": 134.8, "r_y3": 572.2, "coord_origin": "TOPLEFT" }, "text": "valuable information and therefore need to be extracted with high accuracy.", "orig": "valuable information and therefore need to be extracted with high accuracy.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 67, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 134.8, "r_y0": 592.9, "r_x1": 480.6, "r_y1": 592.9, "r_x2": 480.6, "r_y2": 584.2, "r_x3": 134.8, "r_y3": 584.2, "coord_origin": "TOPLEFT" }, "text": "Unfortunately, tables appear in documents in various sizes, styling and struc-", "orig": "Unfortunately, tables appear in documents in various sizes, styling and struc-", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 68, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 134.8, "r_y0": 604.9, "r_x1": 480.6, "r_y1": 604.9, "r_x2": 480.6, "r_y2": 596.1, "r_x3": 134.8, "r_y3": 596.1, "coord_origin": "TOPLEFT" }, "text": "ture, making it difficult to recover their correct structure with simple analyt-", "orig": "ture, making it difficult to recover their correct structure with simple analyt-", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 69, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 134.8, "r_y0": 616.9, "r_x1": 480.6, "r_y1": 616.9, "r_x2": 480.6, "r_y2": 608.1, "r_x3": 134.8, "r_y3": 608.1, "coord_origin": "TOPLEFT" }, "text": "ical methods. Therefore, accurate table extraction is achieved these days with", "orig": "ical methods. Therefore, accurate table extraction is achieved these days with", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 70, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 134.8, "r_y0": 628.8, "r_x1": 279.3, "r_y1": 628.8, "r_x2": 279.3, "r_y2": 620.0, "r_x3": 134.8, "r_y3": 620.0, "coord_origin": "TOPLEFT" }, "text": "machine-learning based methods.", "orig": "machine-learning based methods.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, "text": "Tables are ubiquitous in documents such as scientific papers, patents, reports, manuals, specification sheets or marketing material. They often encode highly valuable information and therefore need to be extracted with high accuracy. Unfortunately, tables appear in documents in various sizes, styling and structure, making it difficult to recover their correct structure with simple analytical methods. Therefore, accurate table extraction is achieved these days with machine-learning based methods." }, { "label": "text", "id": 2, "page_no": 0, "cluster": { "id": 2, "label": "text", "bbox": { "l": 134.8, "t": 632.1, "r": 480.6, "b": 664.9, "coord_origin": "TOPLEFT" }, "confidence": 0.97, "cells": [ { "index": 71, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 149.7, "r_y0": 640.9, "r_x1": 480.6, "r_y1": 640.9, "r_x2": 480.6, "r_y2": 632.1, "r_x3": 149.7, "r_y3": 632.1, "coord_origin": "TOPLEFT" }, "text": "In modern document understanding systems [1,15], table extraction is typi-", "orig": "In modern document understanding systems [1,15], table extraction is typi-", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 72, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 134.8, "r_y0": 652.9, "r_x1": 480.6, "r_y1": 652.9, "r_x2": 480.6, "r_y2": 644.1, "r_x3": 134.8, "r_y3": 644.1, "coord_origin": "TOPLEFT" }, "text": "cally a two-step process. Firstly, every table on a page is located with a bounding", "orig": "cally a two-step process. Firstly, every table on a page is located with a bounding", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 73, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 134.8, "r_y0": 664.9, "r_x1": 480.6, "r_y1": 664.9, "r_x2": 480.6, "r_y2": 656.1, "r_x3": 134.8, "r_y3": 656.1, "coord_origin": "TOPLEFT" }, "text": "box, and secondly, their logical row and column structure is recognized. As of", "orig": "box, and secondly, their logical row and column structure is recognized. As of", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, "text": "In modern document understanding systems [1,15], table extraction is typically a two-step process. Firstly, every table on a page is located with a bounding box, and secondly, their logical row and column structure is recognized. As of" } ], "headers": [ { "label": "page_header", "id": 6, "page_no": 0, "cluster": { "id": 6, "label": "page_header", "bbox": { "l": 18.3, "t": 209.5, "r": 36.3, "b": 555.0, "coord_origin": "TOPLEFT" }, "confidence": 0.89, "cells": [ { "index": 74, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 18.3, "r_y0": 555.0, "r_x1": 36.3, "r_y1": 555.0, "r_x2": 36.3, "r_y2": 209.5, "r_x3": 18.3, "r_y3": 209.5, "coord_origin": "TOPLEFT" }, "text": "arXiv:2305.03393v1 [cs.CV] 5 May 2023", "orig": "arXiv:2305.03393v1 [cs.CV] 5 May 2023", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, "text": "arXiv:2305.03393v1 [cs.CV] 5 May 2023" } ] } }, { "page_no": 1, "size": { "width": 612.0, "height": 792.0 }, "parsed_page": { "dimension": { "angle": 0.0, "rect": { "r_x0": 0.0, "r_y0": 0.0, "r_x1": 612.0, "r_y1": 0.0, "r_x2": 612.0, "r_y2": 792.0, "r_x3": 0.0, "r_y3": 792.0, "coord_origin": "BOTTOMLEFT" }, "boundary_type": "crop_box", "art_bbox": { "l": 0.0, "t": 792.0, "r": 612.0, "b": 0.0, "coord_origin": "BOTTOMLEFT" }, "bleed_bbox": { "l": 0.0, "t": 792.0, "r": 612.0, "b": 0.0, "coord_origin": "BOTTOMLEFT" }, "crop_bbox": { "l": 0.0, "t": 792.0, "r": 612.0, "b": 0.0, "coord_origin": "BOTTOMLEFT" }, "media_bbox": { "l": 0.0, "t": 792.0, "r": 612.0, "b": 0.0, "coord_origin": "BOTTOMLEFT" }, "trim_bbox": { "l": 0.0, "t": 792.0, "r": 612.0, "b": 0.0, "coord_origin": "BOTTOMLEFT" } }, "bitmap_resources": [], "char_cells": [], "word_cells": [], "textline_cells": [ { "index": 0, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 134.8, "r_y0": 101.8, "r_x1": 139.4, "r_y1": 101.8, "r_x2": 139.4, "r_y2": 93.8, "r_x3": 134.8, "r_y3": 93.8, "coord_origin": "TOPLEFT" }, "text": "2", "orig": "2", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 1, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 167.8, "r_y0": 101.8, "r_x1": 178.1, "r_y1": 101.8, "r_x2": 178.1, "r_y2": 93.8, "r_x3": 167.8, "r_y3": 93.8, "coord_origin": "TOPLEFT" }, "text": "M.", "orig": "M.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 2, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 182.4, "r_y0": 101.8, "r_x1": 231.7, "r_y1": 101.8, "r_x2": 231.7, "r_y2": 93.8, "r_x3": 182.4, "r_y3": 93.8, "coord_origin": "TOPLEFT" }, "text": "Lysak, et al.", "orig": "Lysak, et al.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 3, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 134.8, "r_y0": 134.3, "r_x1": 162.6, "r_y1": 134.3, "r_x2": 162.6, "r_y2": 126.3, "r_x3": 134.8, "r_y3": 126.3, "coord_origin": "TOPLEFT" }, "text": "Fig. 1.", "orig": "Fig. 1.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 4, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 167.1, "r_y0": 134.5, "r_x1": 480.6, "r_y1": 134.5, "r_x2": 480.6, "r_y2": 126.4, "r_x3": 167.1, "r_y3": 126.4, "coord_origin": "TOPLEFT" }, "text": "Comparison between HTML and OTSL table structure representation: (A)", "orig": "Comparison between HTML and OTSL table structure representation: (A)", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 5, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 134.8, "r_y0": 145.4, "r_x1": 480.6, "r_y1": 145.4, "r_x2": 480.6, "r_y2": 137.4, "r_x3": 134.8, "r_y3": 137.4, "coord_origin": "TOPLEFT" }, "text": "table-example with complex row and column headers, including a 2D empty span,", "orig": "table-example with complex row and column headers, including a 2D empty span,", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 6, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 134.8, "r_y0": 156.4, "r_x1": 148.0, "r_y1": 156.4, "r_x2": 148.0, "r_y2": 148.3, "r_x3": 134.8, "r_y3": 148.3, "coord_origin": "TOPLEFT" }, "text": "(B)", "orig": "(B)", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 7, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 152.4, "r_y0": 156.4, "r_x1": 480.6, "r_y1": 156.4, "r_x2": 480.6, "r_y2": 148.3, "r_x3": 152.4, "r_y3": 148.3, "coord_origin": "TOPLEFT" }, "text": "minimal graphical representation of table structure using rectangular layout, (C)", "orig": "minimal graphical representation of table structure using rectangular layout, (C)", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 8, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 134.8, "r_y0": 167.3, "r_x1": 480.6, "r_y1": 167.3, "r_x2": 480.6, "r_y2": 159.3, "r_x3": 134.8, "r_y3": 159.3, "coord_origin": "TOPLEFT" }, "text": "HTML representation, (D) OTSL representation. This example demonstrates many of", "orig": "HTML representation, (D) OTSL representation. This example demonstrates many of", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 9, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 134.8, "r_y0": 178.3, "r_x1": 480.6, "r_y1": 178.3, "r_x2": 480.6, "r_y2": 170.2, "r_x3": 134.8, "r_y3": 170.2, "coord_origin": "TOPLEFT" }, "text": "the key-features of OTSL, namely its reduced vocabulary size (12 versus 5 in this case),", "orig": "the key-features of OTSL, namely its reduced vocabulary size (12 versus 5 in this case),", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 10, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 134.8, "r_y0": 189.3, "r_x1": 480.6, "r_y1": 189.3, "r_x2": 480.6, "r_y2": 181.2, "r_x3": 134.8, "r_y3": 181.2, "coord_origin": "TOPLEFT" }, "text": "its reduced sequence length (55 versus 30) and a enhanced internal structure (variable", "orig": "its reduced sequence length (55 versus 30) and a enhanced internal structure (variable", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 11, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 134.8, "r_y0": 200.2, "r_x1": 460.9, "r_y1": 200.2, "r_x2": 460.9, "r_y2": 192.2, "r_x3": 134.8, "r_y3": 192.2, "coord_origin": "TOPLEFT" }, "text": "token sequence length per row in HTML versus a fixed length of rows in OTSL).", "orig": "token sequence length per row in HTML versus a fixed length of rows in OTSL).", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 12, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 396.4, "r_y0": 289.5, "r_x1": 403.0, "r_y1": 289.5, "r_x2": 403.0, "r_y2": 281.0, "r_x3": 396.4, "r_y3": 281.0, "coord_origin": "TOPLEFT" }, "text": "C", "orig": "C", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 13, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 418.6, "r_y0": 289.4, "r_x1": 425.1, "r_y1": 289.4, "r_x2": 425.1, "r_y2": 280.9, "r_x3": 418.6, "r_y3": 280.9, "coord_origin": "TOPLEFT" }, "text": "C", "orig": "C", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 14, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 395.7, "r_y0": 311.8, "r_x1": 402.3, "r_y1": 311.8, "r_x2": 402.3, "r_y2": 303.2, "r_x3": 395.7, "r_y3": 303.2, "coord_origin": "TOPLEFT" }, "text": "C", "orig": "C", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 15, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 407.5, "r_y0": 311.9, "r_x1": 414.1, "r_y1": 311.9, "r_x2": 414.1, "r_y2": 303.4, "r_x3": 407.5, "r_y3": 303.4, "coord_origin": "TOPLEFT" }, "text": "C", "orig": "C", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 16, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 407.6, "r_y0": 322.9, "r_x1": 414.1, "r_y1": 322.9, "r_x2": 414.1, "r_y2": 314.4, "r_x3": 407.6, "r_y3": 314.4, "coord_origin": "TOPLEFT" }, "text": "C", "orig": "C", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 17, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 418.5, "r_y0": 300.6, "r_x1": 425.1, "r_y1": 300.6, "r_x2": 425.1, "r_y2": 292.1, "r_x3": 418.5, "r_y3": 292.1, "coord_origin": "TOPLEFT" }, "text": "C", "orig": "C", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 18, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 429.6, "r_y0": 300.6, "r_x1": 436.2, "r_y1": 300.6, "r_x2": 436.2, "r_y2": 292.1, "r_x3": 429.6, "r_y3": 292.1, "coord_origin": "TOPLEFT" }, "text": "C", "orig": "C", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 19, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 440.7, "r_y0": 300.5, "r_x1": 447.2, "r_y1": 300.5, "r_x2": 447.2, "r_y2": 292.0, "r_x3": 440.7, "r_y3": 292.0, "coord_origin": "TOPLEFT" }, "text": "C", "orig": "C", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 20, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 418.6, "r_y0": 311.8, "r_x1": 425.2, "r_y1": 311.8, "r_x2": 425.2, "r_y2": 303.3, "r_x3": 418.6, "r_y3": 303.3, "coord_origin": "TOPLEFT" }, "text": "C", "orig": "C", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 21, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 429.7, "r_y0": 311.8, "r_x1": 436.3, "r_y1": 311.8, "r_x2": 436.3, "r_y2": 303.3, "r_x3": 429.7, "r_y3": 303.3, "coord_origin": "TOPLEFT" }, "text": "C", "orig": "C", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 22, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 440.8, "r_y0": 311.7, "r_x1": 447.4, "r_y1": 311.7, "r_x2": 447.4, "r_y2": 303.2, "r_x3": 440.8, "r_y3": 303.2, "coord_origin": "TOPLEFT" }, "text": "C", "orig": "C", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 23, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 418.6, "r_y0": 323.1, "r_x1": 425.2, "r_y1": 323.1, "r_x2": 425.2, "r_y2": 314.6, "r_x3": 418.6, "r_y3": 314.6, "coord_origin": "TOPLEFT" }, "text": "C", "orig": "C", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 24, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 429.7, "r_y0": 323.1, "r_x1": 436.3, "r_y1": 323.1, "r_x2": 436.3, "r_y2": 314.6, "r_x3": 429.7, "r_y3": 314.6, "coord_origin": "TOPLEFT" }, "text": "C", "orig": "C", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 25, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 440.8, "r_y0": 323.0, "r_x1": 447.4, "r_y1": 323.0, "r_x2": 447.4, "r_y2": 314.5, "r_x3": 440.8, "r_y3": 314.5, "coord_origin": "TOPLEFT" }, "text": "C", "orig": "C", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 26, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 407.4, "r_y0": 333.8, "r_x1": 414.0, "r_y1": 333.8, "r_x2": 414.0, "r_y2": 325.3, "r_x3": 407.4, "r_y3": 325.3, "coord_origin": "TOPLEFT" }, "text": "C", "orig": "C", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 27, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 418.5, "r_y0": 334.0, "r_x1": 425.0, "r_y1": 334.0, "r_x2": 425.0, "r_y2": 325.5, "r_x3": 418.5, "r_y3": 325.5, "coord_origin": "TOPLEFT" }, "text": "C", "orig": "C", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 28, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 429.5, "r_y0": 334.0, "r_x1": 436.1, "r_y1": 334.0, "r_x2": 436.1, "r_y2": 325.5, "r_x3": 429.5, "r_y3": 325.5, "coord_origin": "TOPLEFT" }, "text": "C", "orig": "C", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 29, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 440.6, "r_y0": 333.9, "r_x1": 447.2, "r_y1": 333.9, "r_x2": 447.2, "r_y2": 325.4, "r_x3": 440.6, "r_y3": 325.4, "coord_origin": "TOPLEFT" }, "text": "C", "orig": "C", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 30, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 451.9, "r_y0": 288.7, "r_x1": 463.5, "r_y1": 288.7, "r_x2": 463.5, "r_y2": 280.2, "r_x3": 451.9, "r_y3": 280.2, "coord_origin": "TOPLEFT" }, "text": "NL", "orig": "NL", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 31, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 452.2, "r_y0": 300.1, "r_x1": 463.8, "r_y1": 300.1, "r_x2": 463.8, "r_y2": 291.6, "r_x3": 452.2, "r_y3": 291.6, "coord_origin": "TOPLEFT" }, "text": "NL", "orig": "NL", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 32, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 452.2, "r_y0": 311.4, "r_x1": 463.8, "r_y1": 311.4, "r_x2": 463.8, "r_y2": 302.8, "r_x3": 452.2, "r_y3": 302.8, "coord_origin": "TOPLEFT" }, "text": "NL", "orig": "NL", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 33, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 452.1, "r_y0": 322.6, "r_x1": 463.7, "r_y1": 322.6, "r_x2": 463.7, "r_y2": 314.1, "r_x3": 452.1, "r_y3": 314.1, "coord_origin": "TOPLEFT" }, "text": "NL", "orig": "NL", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 34, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 452.3, "r_y0": 334.0, "r_x1": 463.9, "r_y1": 334.0, "r_x2": 463.9, "r_y2": 325.5, "r_x3": 452.3, "r_y3": 325.5, "coord_origin": "TOPLEFT" }, "text": "NL", "orig": "NL", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 35, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 396.1, "r_y0": 323.0, "r_x1": 402.7, "r_y1": 323.0, "r_x2": 402.7, "r_y2": 314.5, "r_x3": 396.1, "r_y3": 314.5, "coord_origin": "TOPLEFT" }, "text": "U", "orig": "U", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 36, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 396.0, "r_y0": 333.9, "r_x1": 402.6, "r_y1": 333.9, "r_x2": 402.6, "r_y2": 325.4, "r_x3": 396.0, "r_y3": 325.4, "coord_origin": "TOPLEFT" }, "text": "U", "orig": "U", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 37, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 396.3, "r_y0": 300.8, "r_x1": 402.8, "r_y1": 300.8, "r_x2": 402.8, "r_y2": 292.3, "r_x3": 396.3, "r_y3": 292.3, "coord_origin": "TOPLEFT" }, "text": "U", "orig": "U", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 38, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 408.5, "r_y0": 289.5, "r_x1": 413.6, "r_y1": 289.5, "r_x2": 413.6, "r_y2": 281.0, "r_x3": 408.5, "r_y3": 281.0, "coord_origin": "TOPLEFT" }, "text": "L", "orig": "L", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 39, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 430.6, "r_y0": 289.0, "r_x1": 435.6, "r_y1": 289.0, "r_x2": 435.6, "r_y2": 280.5, "r_x3": 430.6, "r_y3": 280.5, "coord_origin": "TOPLEFT" }, "text": "L", "orig": "L", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 40, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 441.1, "r_y0": 288.9, "r_x1": 446.1, "r_y1": 288.9, "r_x2": 446.1, "r_y2": 280.4, "r_x3": 441.1, "r_y3": 280.4, "coord_origin": "TOPLEFT" }, "text": "L", "orig": "L", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 41, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 408.0, "r_y0": 300.7, "r_x1": 414.0, "r_y1": 300.7, "r_x2": 414.0, "r_y2": 292.1, "r_x3": 408.0, "r_y3": 292.1, "coord_origin": "TOPLEFT" }, "text": "X", "orig": "X", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 42, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 441.3, "r_y0": 419.7, "r_x1": 452.9, "r_y1": 419.7, "r_x2": 452.9, "r_y2": 411.2, "r_x3": 441.3, "r_y3": 411.2, "coord_origin": "TOPLEFT" }, "text": "NL", "orig": "NL", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 43, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 393.8, "r_y0": 406.9, "r_x1": 432.5, "r_y1": 406.9, "r_x2": 432.5, "r_y2": 399.8, "r_x3": 393.8, "r_y3": 399.8, "coord_origin": "TOPLEFT" }, "text": "vocabulary:", "orig": "vocabulary:", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 44, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 434.6, "r_y0": 406.9, "r_x1": 438.8, "r_y1": 406.9, "r_x2": 438.8, "r_y2": 399.8, "r_x3": 434.6, "r_y3": 399.8, "coord_origin": "TOPLEFT" }, "text": "5", "orig": "5", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 45, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 440.9, "r_y0": 406.9, "r_x1": 463.2, "r_y1": 406.9, "r_x2": 463.2, "r_y2": 399.8, "r_x3": 440.9, "r_y3": 399.8, "coord_origin": "TOPLEFT" }, "text": "tokens", "orig": "tokens", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 46, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 384.1, "r_y0": 265.7, "r_x1": 414.0, "r_y1": 265.7, "r_x2": 414.0, "r_y2": 258.5, "r_x3": 384.1, "r_y3": 258.5, "coord_origin": "TOPLEFT" }, "text": "D OTSL", "orig": "D OTSL", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 47, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 393.8, "r_y0": 273.8, "r_x1": 451.5, "r_y1": 273.8, "r_x2": 451.5, "r_y2": 266.7, "r_x3": 393.8, "r_y3": 266.7, "coord_origin": "TOPLEFT" }, "text": "sequence length:", "orig": "sequence length:", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 48, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 453.6, "r_y0": 273.8, "r_x1": 462.0, "r_y1": 273.8, "r_x2": 462.0, "r_y2": 266.7, "r_x3": 453.6, "r_y3": 266.7, "coord_origin": "TOPLEFT" }, "text": "30", "orig": "30", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 49, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 151.8, "r_y0": 406.9, "r_x1": 233.9, "r_y1": 406.9, "r_x2": 233.9, "r_y2": 399.8, "r_x3": 151.8, "r_y3": 399.8, "coord_origin": "TOPLEFT" }, "text": "vocabulary for this table:", "orig": "vocabulary for this table:", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 50, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 236.0, "r_y0": 406.9, "r_x1": 244.4, "r_y1": 406.9, "r_x2": 244.4, "r_y2": 399.8, "r_x3": 236.0, "r_y3": 399.8, "coord_origin": "TOPLEFT" }, "text": "12", "orig": "12", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 51, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 246.5, "r_y0": 406.9, "r_x1": 268.8, "r_y1": 406.9, "r_x2": 268.8, "r_y2": 399.8, "r_x3": 246.5, "r_y3": 399.8, "coord_origin": "TOPLEFT" }, "text": "tokens", "orig": "tokens", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 52, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 154.3, "r_y0": 220.7, "r_x1": 159.8, "r_y1": 220.7, "r_x2": 159.8, "r_y2": 213.6, "r_x3": 154.3, "r_y3": 213.6, "coord_origin": "TOPLEFT" }, "text": "A", "orig": "A", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 53, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 321.1, "r_y0": 220.7, "r_x1": 326.5, "r_y1": 220.7, "r_x2": 326.5, "r_y2": 213.6, "r_x3": 321.1, "r_y3": 213.6, "coord_origin": "TOPLEFT" }, "text": "B", "orig": "B", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 54, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 153.1, "r_y0": 286.7, "r_x1": 175.8, "r_y1": 286.7, "r_x2": 175.8, "r_y2": 280.3, "r_x3": 153.1, "r_y3": 280.3, "coord_origin": "TOPLEFT" }, "text": "", "orig": "
", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 55, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 160.7, "r_y0": 293.5, "r_x1": 172.8, "r_y1": 293.5, "r_x2": 172.8, "r_y2": 287.1, "r_x3": 160.7, "r_y3": 287.1, "coord_origin": "TOPLEFT" }, "text": "", "orig": "", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 56, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 168.2, "r_y0": 300.3, "r_x1": 177.9, "r_y1": 300.3, "r_x2": 177.9, "r_y2": 293.9, "r_x3": 168.2, "r_y3": 293.9, "coord_origin": "TOPLEFT" }, "text": "", "orig": ">", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 60, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 263.4, "r_y0": 300.3, "r_x1": 278.9, "r_y1": 300.3, "r_x2": 278.9, "r_y2": 293.9, "r_x3": 263.4, "r_y3": 293.9, "coord_origin": "TOPLEFT" }, "text": "", "orig": "", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 61, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 280.8, "r_y0": 300.3, "r_x1": 290.5, "r_y1": 300.3, "r_x2": 290.5, "r_y2": 293.9, "r_x3": 280.8, "r_y3": 293.9, "coord_origin": "TOPLEFT" }, "text": "", "orig": ">", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 64, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 335.9, "r_y0": 300.3, "r_x1": 351.5, "r_y1": 300.3, "r_x2": 351.5, "r_y2": 293.9, "r_x3": 335.9, "r_y3": 293.9, "coord_origin": "TOPLEFT" }, "text": "", "orig": "", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 65, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 160.7, "r_y0": 307.1, "r_x1": 174.7, "r_y1": 307.1, "r_x2": 174.7, "r_y2": 300.8, "r_x3": 160.7, "r_y3": 300.8, "coord_origin": "TOPLEFT" }, "text": "", "orig": "", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 66, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 160.7, "r_y0": 314.0, "r_x1": 172.8, "r_y1": 314.0, "r_x2": 172.8, "r_y2": 307.6, "r_x3": 160.7, "r_y3": 307.6, "coord_origin": "TOPLEFT" }, "text": "", "orig": "", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 67, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 168.2, "r_y0": 320.8, "r_x1": 181.9, "r_y1": 320.8, "r_x2": 181.9, "r_y2": 314.4, "r_x3": 168.2, "r_y3": 314.4, "coord_origin": "TOPLEFT" }, "text": "", "orig": "", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 69, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 201.2, "r_y0": 320.8, "r_x1": 214.9, "r_y1": 320.8, "r_x2": 214.9, "r_y2": 314.4, "r_x3": 201.2, "r_y3": 314.4, "coord_origin": "TOPLEFT" }, "text": "", "orig": "", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 71, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 234.2, "r_y0": 320.8, "r_x1": 247.8, "r_y1": 320.8, "r_x2": 247.8, "r_y2": 314.4, "r_x3": 234.2, "r_y3": 314.4, "coord_origin": "TOPLEFT" }, "text": "", "orig": "", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 73, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 160.7, "r_y0": 327.6, "r_x1": 174.7, "r_y1": 327.6, "r_x2": 174.7, "r_y2": 321.2, "r_x3": 160.7, "r_y3": 321.2, "coord_origin": "TOPLEFT" }, "text": "", "orig": "", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 74, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 160.7, "r_y0": 334.4, "r_x1": 172.8, "r_y1": 334.4, "r_x2": 172.8, "r_y2": 328.0, "r_x3": 160.7, "r_y3": 328.0, "coord_origin": "TOPLEFT" }, "text": "", "orig": "", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 75, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 168.2, "r_y0": 341.2, "r_x1": 373.1, "r_y1": 341.2, "r_x2": 373.1, "r_y2": 334.8, "r_x3": 168.2, "r_y3": 334.8, "coord_origin": "TOPLEFT" }, "text": "", "orig": "", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 76, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 160.7, "r_y0": 348.0, "r_x1": 174.7, "r_y1": 348.0, "r_x2": 174.7, "r_y2": 341.7, "r_x3": 160.7, "r_y3": 341.7, "coord_origin": "TOPLEFT" }, "text": "", "orig": "", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 77, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 160.7, "r_y0": 354.9, "r_x1": 172.8, "r_y1": 354.9, "r_x2": 172.8, "r_y2": 348.5, "r_x3": 160.7, "r_y3": 348.5, "coord_origin": "TOPLEFT" }, "text": "", "orig": "", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 78, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 168.2, "r_y0": 361.7, "r_x1": 181.9, "r_y1": 361.7, "r_x2": 181.9, "r_y2": 355.3, "r_x3": 168.2, "r_y3": 355.3, "coord_origin": "TOPLEFT" }, "text": "", "orig": "", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 80, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 201.2, "r_y0": 361.7, "r_x1": 214.9, "r_y1": 361.7, "r_x2": 214.9, "r_y2": 355.3, "r_x3": 201.2, "r_y3": 355.3, "coord_origin": "TOPLEFT" }, "text": "", "orig": "", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 82, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 234.2, "r_y0": 361.7, "r_x1": 247.8, "r_y1": 361.7, "r_x2": 247.8, "r_y2": 355.3, "r_x3": 234.2, "r_y3": 355.3, "coord_origin": "TOPLEFT" }, "text": "", "orig": "", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 84, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 267.2, "r_y0": 361.7, "r_x1": 280.8, "r_y1": 361.7, "r_x2": 280.8, "r_y2": 355.3, "r_x3": 267.2, "r_y3": 355.3, "coord_origin": "TOPLEFT" }, "text": "", "orig": "", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 86, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 160.7, "r_y0": 368.5, "r_x1": 174.7, "r_y1": 368.5, "r_x2": 174.7, "r_y2": 362.1, "r_x3": 160.7, "r_y3": 362.1, "coord_origin": "TOPLEFT" }, "text": "", "orig": "", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 87, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 160.7, "r_y0": 375.3, "r_x1": 172.8, "r_y1": 375.3, "r_x2": 172.8, "r_y2": 368.9, "r_x3": 160.7, "r_y3": 368.9, "coord_origin": "TOPLEFT" }, "text": "", "orig": "", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 88, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 168.2, "r_y0": 382.1, "r_x1": 181.9, "r_y1": 382.1, "r_x2": 181.9, "r_y2": 375.7, "r_x3": 168.2, "r_y3": 375.7, "coord_origin": "TOPLEFT" }, "text": "", "orig": "", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 90, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 201.2, "r_y0": 382.1, "r_x1": 214.9, "r_y1": 382.1, "r_x2": 214.9, "r_y2": 375.7, "r_x3": 201.2, "r_y3": 375.7, "coord_origin": "TOPLEFT" }, "text": "", "orig": "", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 92, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 234.2, "r_y0": 382.1, "r_x1": 247.8, "r_y1": 382.1, "r_x2": 247.8, "r_y2": 375.7, "r_x3": 234.2, "r_y3": 375.7, "coord_origin": "TOPLEFT" }, "text": "", "orig": "", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 94, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 267.2, "r_y0": 382.1, "r_x1": 280.8, "r_y1": 382.1, "r_x2": 280.8, "r_y2": 375.7, "r_x3": 267.2, "r_y3": 375.7, "coord_origin": "TOPLEFT" }, "text": "", "orig": "", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 96, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 160.7, "r_y0": 388.9, "r_x1": 174.7, "r_y1": 388.9, "r_x2": 174.7, "r_y2": 382.6, "r_x3": 160.7, "r_y3": 382.6, "coord_origin": "TOPLEFT" }, "text": "", "orig": "", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 97, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 153.1, "r_y0": 395.8, "r_x1": 177.7, "r_y1": 395.8, "r_x2": 177.7, "r_y2": 389.4, "r_x3": 153.1, "r_y3": 389.4, "coord_origin": "TOPLEFT" }, "text": "
", "orig": "", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 68, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 183.8, "r_y0": 320.8, "r_x1": 199.3, "r_y1": 320.8, "r_x2": 199.3, "r_y2": 314.4, "r_x3": 183.8, "r_y3": 314.4, "coord_origin": "TOPLEFT" }, "text": "", "orig": "", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 70, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 216.8, "r_y0": 320.8, "r_x1": 232.3, "r_y1": 320.8, "r_x2": 232.3, "r_y2": 314.4, "r_x3": 216.8, "r_y3": 314.4, "coord_origin": "TOPLEFT" }, "text": "", "orig": "", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 72, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 249.7, "r_y0": 320.8, "r_x1": 265.3, "r_y1": 320.8, "r_x2": 265.3, "r_y2": 314.4, "r_x3": 249.7, "r_y3": 314.4, "coord_origin": "TOPLEFT" }, "text": "
", "orig": "", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 79, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 183.8, "r_y0": 361.7, "r_x1": 199.3, "r_y1": 361.7, "r_x2": 199.3, "r_y2": 355.3, "r_x3": 183.8, "r_y3": 355.3, "coord_origin": "TOPLEFT" }, "text": "", "orig": "", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 81, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 216.8, "r_y0": 361.7, "r_x1": 232.3, "r_y1": 361.7, "r_x2": 232.3, "r_y2": 355.3, "r_x3": 216.8, "r_y3": 355.3, "coord_origin": "TOPLEFT" }, "text": "", "orig": "", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 83, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 249.7, "r_y0": 361.7, "r_x1": 265.3, "r_y1": 361.7, "r_x2": 265.3, "r_y2": 355.3, "r_x3": 249.7, "r_y3": 355.3, "coord_origin": "TOPLEFT" }, "text": "", "orig": "", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 85, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 282.7, "r_y0": 361.7, "r_x1": 298.2, "r_y1": 361.7, "r_x2": 298.2, "r_y2": 355.3, "r_x3": 282.7, "r_y3": 355.3, "coord_origin": "TOPLEFT" }, "text": "
", "orig": "", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 89, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 183.8, "r_y0": 382.1, "r_x1": 199.3, "r_y1": 382.1, "r_x2": 199.3, "r_y2": 375.7, "r_x3": 183.8, "r_y3": 375.7, "coord_origin": "TOPLEFT" }, "text": "", "orig": "", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 91, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 216.8, "r_y0": 382.1, "r_x1": 232.3, "r_y1": 382.1, "r_x2": 232.3, "r_y2": 375.7, "r_x3": 216.8, "r_y3": 375.7, "coord_origin": "TOPLEFT" }, "text": "", "orig": "", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 93, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 249.7, "r_y0": 382.1, "r_x1": 265.3, "r_y1": 382.1, "r_x2": 265.3, "r_y2": 375.7, "r_x3": 249.7, "r_y3": 375.7, "coord_origin": "TOPLEFT" }, "text": "", "orig": "", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 95, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 282.7, "r_y0": 382.1, "r_x1": 298.2, "r_y1": 382.1, "r_x2": 298.2, "r_y2": 375.7, "r_x3": 282.7, "r_y3": 375.7, "coord_origin": "TOPLEFT" }, "text": "
", "orig": "", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 98, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 395.1, "r_y0": 419.9, "r_x1": 401.6, "r_y1": 419.9, "r_x2": 401.6, "r_y2": 411.3, "r_x3": 395.1, "r_y3": 411.3, "coord_origin": "TOPLEFT" }, "text": "C", "orig": "C", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 99, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 407.4, "r_y0": 419.9, "r_x1": 412.5, "r_y1": 419.9, "r_x2": 412.5, "r_y2": 411.3, "r_x3": 407.4, "r_y3": 411.3, "coord_origin": "TOPLEFT" }, "text": "L", "orig": "L", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 100, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 418.7, "r_y0": 419.9, "r_x1": 425.3, "r_y1": 419.9, "r_x2": 425.3, "r_y2": 411.3, "r_x3": 418.7, "r_y3": 411.3, "coord_origin": "TOPLEFT" }, "text": "U", "orig": "U", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 101, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 430.5, "r_y0": 419.9, "r_x1": 436.6, "r_y1": 419.9, "r_x2": 436.6, "r_y2": 411.3, "r_x3": 430.5, "r_y3": 411.3, "coord_origin": "TOPLEFT" }, "text": "X", "orig": "X", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 102, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 152.4, "r_y0": 416.2, "r_x1": 175.1, "r_y1": 416.2, "r_x2": 175.1, "r_y2": 409.8, "r_x3": 152.4, "r_y3": 409.8, "coord_origin": "TOPLEFT" }, "text": "", "orig": "
", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 103, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 178.9, "r_y0": 416.2, "r_x1": 191.0, "r_y1": 416.2, "r_x2": 191.0, "r_y2": 409.8, "r_x3": 178.9, "r_y3": 409.8, "coord_origin": "TOPLEFT" }, "text": "", "orig": "", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 104, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 194.8, "r_y0": 416.2, "r_x1": 208.8, "r_y1": 416.2, "r_x2": 208.8, "r_y2": 409.8, "r_x3": 194.8, "r_y3": 409.8, "coord_origin": "TOPLEFT" }, "text": "", "orig": "", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 105, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 212.6, "r_y0": 416.2, "r_x1": 226.3, "r_y1": 416.2, "r_x2": 226.3, "r_y2": 409.8, "r_x3": 212.6, "r_y3": 409.8, "coord_origin": "TOPLEFT" }, "text": "", "orig": "", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 107, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 249.4, "r_y0": 416.2, "r_x1": 259.0, "r_y1": 416.2, "r_x2": 259.0, "r_y2": 409.8, "r_x3": 249.4, "r_y3": 409.8, "coord_origin": "TOPLEFT" }, "text": "", "orig": ">", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 113, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 244.5, "r_y0": 424.5, "r_x1": 269.1, "r_y1": 424.5, "r_x2": 269.1, "r_y2": 418.1, "r_x3": 244.5, "r_y3": 418.1, "coord_origin": "TOPLEFT" }, "text": "
", "orig": "", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 106, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 230.0, "r_y0": 416.2, "r_x1": 245.6, "r_y1": 416.2, "r_x2": 245.6, "r_y2": 409.8, "r_x3": 230.0, "r_y3": 409.8, "coord_origin": "TOPLEFT" }, "text": "
", "orig": "", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 114, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 154.5, "r_y0": 265.7, "r_x1": 159.6, "r_y1": 265.7, "r_x2": 159.6, "r_y2": 258.6, "r_x3": 154.5, "r_y3": 258.6, "coord_origin": "TOPLEFT" }, "text": "C", "orig": "C", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 115, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 164.7, "r_y0": 265.7, "r_x1": 185.2, "r_y1": 265.7, "r_x2": 185.2, "r_y2": 258.6, "r_x3": 164.7, "r_y3": 258.6, "coord_origin": "TOPLEFT" }, "text": "HTML", "orig": "HTML", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 116, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 164.4, "r_y0": 273.6, "r_x1": 222.1, "r_y1": 273.6, "r_x2": 222.1, "r_y2": 266.5, "r_x3": 164.4, "r_y3": 266.5, "coord_origin": "TOPLEFT" }, "text": "sequence length:", "orig": "sequence length:", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 117, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 224.2, "r_y0": 273.6, "r_x1": 232.6, "r_y1": 273.6, "r_x2": 232.6, "r_y2": 266.5, "r_x3": 224.2, "r_y3": 266.5, "coord_origin": "TOPLEFT" }, "text": "55", "orig": "55", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 118, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 134.8, "r_y0": 461.1, "r_x1": 161.3, "r_y1": 461.1, "r_x2": 161.3, "r_y2": 452.3, "r_x3": 134.8, "r_y3": 452.3, "coord_origin": "TOPLEFT" }, "text": "today,", "orig": "today,", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 119, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 164.3, "r_y0": 461.1, "r_x1": 226.3, "r_y1": 461.1, "r_x2": 226.3, "r_y2": 452.3, "r_x3": 164.3, "r_y3": 452.3, "coord_origin": "TOPLEFT" }, "text": "table detection", "orig": "table detection", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 120, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 230.0, "r_y0": 461.1, "r_x1": 480.6, "r_y1": 461.1, "r_x2": 480.6, "r_y2": 452.3, "r_x3": 230.0, "r_y3": 452.3, "coord_origin": "TOPLEFT" }, "text": "in documents is a well understood problem, and the latest", "orig": "in documents is a well understood problem, and the latest", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 121, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 134.8, "r_y0": 473.1, "r_x1": 480.6, "r_y1": 473.1, "r_x2": 480.6, "r_y2": 464.3, "r_x3": 134.8, "r_y3": 464.3, "coord_origin": "TOPLEFT" }, "text": "state-of-the-art (SOTA) object detection methods provide an accuracy compa-", "orig": "state-of-the-art (SOTA) object detection methods provide an accuracy compa-", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 122, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 134.8, "r_y0": 485.0, "r_x1": 480.6, "r_y1": 485.0, "r_x2": 480.6, "r_y2": 476.2, "r_x3": 134.8, "r_y3": 476.2, "coord_origin": "TOPLEFT" }, "text": "rable to human observers [7,8,10,14,23]. On the other hand, the problem of table", "orig": "rable to human observers [7,8,10,14,23]. On the other hand, the problem of table", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 123, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 134.8, "r_y0": 497.0, "r_x1": 480.6, "r_y1": 497.0, "r_x2": 480.6, "r_y2": 488.2, "r_x3": 134.8, "r_y3": 488.2, "coord_origin": "TOPLEFT" }, "text": "structure recognition (TSR) is a lot more challenging and remains a very active", "orig": "structure recognition (TSR) is a lot more challenging and remains a very active", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 124, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 134.8, "r_y0": 508.9, "r_x1": 480.6, "r_y1": 508.9, "r_x2": 480.6, "r_y2": 500.1, "r_x3": 134.8, "r_y3": 500.1, "coord_origin": "TOPLEFT" }, "text": "area of research, in which many novel machine learning algorithms are being", "orig": "area of research, in which many novel machine learning algorithms are being", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 125, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 134.8, "r_y0": 520.9, "r_x1": 313.2, "r_y1": 520.9, "r_x2": 313.2, "r_y2": 512.1, "r_x3": 134.8, "r_y3": 512.1, "coord_origin": "TOPLEFT" }, "text": "explored [3,4,5,9,11,12,13,14,17,18,21,22].", "orig": "explored [3,4,5,9,11,12,13,14,17,18,21,22].", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 126, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 149.7, "r_y0": 533.3, "r_x1": 480.6, "r_y1": 533.3, "r_x2": 480.6, "r_y2": 524.6, "r_x3": 149.7, "r_y3": 524.6, "coord_origin": "TOPLEFT" }, "text": "Recently emerging SOTA methods for table structure recognition employ", "orig": "Recently emerging SOTA methods for table structure recognition employ", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 127, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 134.8, "r_y0": 545.3, "r_x1": 480.6, "r_y1": 545.3, "r_x2": 480.6, "r_y2": 536.5, "r_x3": 134.8, "r_y3": 536.5, "coord_origin": "TOPLEFT" }, "text": "transformer-based models, in which an image of the table is provided to the net-", "orig": "transformer-based models, in which an image of the table is provided to the net-", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 128, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 134.8, "r_y0": 557.3, "r_x1": 480.6, "r_y1": 557.3, "r_x2": 480.6, "r_y2": 548.5, "r_x3": 134.8, "r_y3": 548.5, "coord_origin": "TOPLEFT" }, "text": "work in order to predict the structure of the table as a sequence of tokens. These", "orig": "work in order to predict the structure of the table as a sequence of tokens. These", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 129, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 134.8, "r_y0": 569.2, "r_x1": 480.6, "r_y1": 569.2, "r_x2": 480.6, "r_y2": 560.4, "r_x3": 134.8, "r_y3": 560.4, "coord_origin": "TOPLEFT" }, "text": "image-to-sequence (Im2Seq) models are extremely powerful, since they allow for", "orig": "image-to-sequence (Im2Seq) models are extremely powerful, since they allow for", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 130, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 134.8, "r_y0": 581.2, "r_x1": 480.6, "r_y1": 581.2, "r_x2": 480.6, "r_y2": 572.4, "r_x3": 134.8, "r_y3": 572.4, "coord_origin": "TOPLEFT" }, "text": "a purely data-driven solution. The tokens of the sequence typically belong to a", "orig": "a purely data-driven solution. The tokens of the sequence typically belong to a", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 131, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 134.8, "r_y0": 593.1, "r_x1": 480.6, "r_y1": 593.1, "r_x2": 480.6, "r_y2": 584.3, "r_x3": 134.8, "r_y3": 584.3, "coord_origin": "TOPLEFT" }, "text": "markup language such as HTML, Latex or Markdown, which allow to describe", "orig": "markup language such as HTML, Latex or Markdown, which allow to describe", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 132, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 134.8, "r_y0": 605.1, "r_x1": 480.6, "r_y1": 605.1, "r_x2": 480.6, "r_y2": 596.3, "r_x3": 134.8, "r_y3": 596.3, "coord_origin": "TOPLEFT" }, "text": "table structure as rows, columns and spanning cells in various configurations.", "orig": "table structure as rows, columns and spanning cells in various configurations.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 133, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 134.8, "r_y0": 617.0, "r_x1": 480.6, "r_y1": 617.0, "r_x2": 480.6, "r_y2": 608.2, "r_x3": 134.8, "r_y3": 608.2, "coord_origin": "TOPLEFT" }, "text": "In Figure 1, we illustrate how HTML is used to represent the table-structure", "orig": "In Figure 1, we illustrate how HTML is used to represent the table-structure", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 134, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 134.8, "r_y0": 629.0, "r_x1": 480.6, "r_y1": 629.0, "r_x2": 480.6, "r_y2": 620.2, "r_x3": 134.8, "r_y3": 620.2, "coord_origin": "TOPLEFT" }, "text": "of a particular example table. Public table-structure data sets such as PubTab-", "orig": "of a particular example table. Public table-structure data sets such as PubTab-", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 135, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 134.8, "r_y0": 640.9, "r_x1": 480.6, "r_y1": 640.9, "r_x2": 480.6, "r_y2": 632.1, "r_x3": 134.8, "r_y3": 632.1, "coord_origin": "TOPLEFT" }, "text": "Net [22], and FinTabNet [21], which were created in a semi-automated way from", "orig": "Net [22], and FinTabNet [21], which were created in a semi-automated way from", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 136, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 134.8, "r_y0": 652.9, "r_x1": 480.6, "r_y1": 652.9, "r_x2": 480.6, "r_y2": 644.1, "r_x3": 134.8, "r_y3": 644.1, "coord_origin": "TOPLEFT" }, "text": "paired PDF and HTML sources (e.g. PubMed Central), popularized primarily", "orig": "paired PDF and HTML sources (e.g. PubMed Central), popularized primarily", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 137, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 134.8, "r_y0": 664.9, "r_x1": 421.5, "r_y1": 664.9, "r_x2": 421.5, "r_y2": 656.1, "r_x3": 134.8, "r_y3": 656.1, "coord_origin": "TOPLEFT" }, "text": "the use of HTML as ground-truth representation format for TSR.", "orig": "the use of HTML as ground-truth representation format for TSR.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "has_chars": false, "has_words": false, "has_lines": true, "image": null, "lines": [] }, "predictions": { "layout": { "clusters": [ { "id": 5, "label": "page_header", "bbox": { "l": 134.8, "t": 93.8, "r": 139.4, "b": 101.8, "coord_origin": "TOPLEFT" }, "confidence": 0.86, "cells": [ { "index": 0, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 134.8, "r_y0": 101.8, "r_x1": 139.4, "r_y1": 101.8, "r_x2": 139.4, "r_y2": 93.8, "r_x3": 134.8, "r_y3": 93.8, "coord_origin": "TOPLEFT" }, "text": "2", "orig": "2", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 3, "label": "page_header", "bbox": { "l": 167.8, "t": 93.8, "r": 231.7, "b": 101.8, "coord_origin": "TOPLEFT" }, "confidence": 0.91, "cells": [ { "index": 1, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 167.8, "r_y0": 101.8, "r_x1": 178.1, "r_y1": 101.8, "r_x2": 178.1, "r_y2": 93.8, "r_x3": 167.8, "r_y3": 93.8, "coord_origin": "TOPLEFT" }, "text": "M.", "orig": "M.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 2, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 182.4, "r_y0": 101.8, "r_x1": 231.7, "r_y1": 101.8, "r_x2": 231.7, "r_y2": 93.8, "r_x3": 182.4, "r_y3": 93.8, "coord_origin": "TOPLEFT" }, "text": "Lysak, et al.", "orig": "Lysak, et al.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 4, "label": "caption", "bbox": { "l": 134.8, "t": 126.3, "r": 480.6, "b": 200.2, "coord_origin": "TOPLEFT" }, "confidence": 0.89, "cells": [ { "index": 3, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 134.8, "r_y0": 134.3, "r_x1": 162.6, "r_y1": 134.3, "r_x2": 162.6, "r_y2": 126.3, "r_x3": 134.8, "r_y3": 126.3, "coord_origin": "TOPLEFT" }, "text": "Fig. 1.", "orig": "Fig. 1.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 4, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 167.1, "r_y0": 134.5, "r_x1": 480.6, "r_y1": 134.5, "r_x2": 480.6, "r_y2": 126.4, "r_x3": 167.1, "r_y3": 126.4, "coord_origin": "TOPLEFT" }, "text": "Comparison between HTML and OTSL table structure representation: (A)", "orig": "Comparison between HTML and OTSL table structure representation: (A)", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 5, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 134.8, "r_y0": 145.4, "r_x1": 480.6, "r_y1": 145.4, "r_x2": 480.6, "r_y2": 137.4, "r_x3": 134.8, "r_y3": 137.4, "coord_origin": "TOPLEFT" }, "text": "table-example with complex row and column headers, including a 2D empty span,", "orig": "table-example with complex row and column headers, including a 2D empty span,", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 6, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 134.8, "r_y0": 156.4, "r_x1": 148.0, "r_y1": 156.4, "r_x2": 148.0, "r_y2": 148.3, "r_x3": 134.8, "r_y3": 148.3, "coord_origin": "TOPLEFT" }, "text": "(B)", "orig": "(B)", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 7, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 152.4, "r_y0": 156.4, "r_x1": 480.6, "r_y1": 156.4, "r_x2": 480.6, "r_y2": 148.3, "r_x3": 152.4, "r_y3": 148.3, "coord_origin": "TOPLEFT" }, "text": "minimal graphical representation of table structure using rectangular layout, (C)", "orig": "minimal graphical representation of table structure using rectangular layout, (C)", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 8, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 134.8, "r_y0": 167.3, "r_x1": 480.6, "r_y1": 167.3, "r_x2": 480.6, "r_y2": 159.3, "r_x3": 134.8, "r_y3": 159.3, "coord_origin": "TOPLEFT" }, "text": "HTML representation, (D) OTSL representation. This example demonstrates many of", "orig": "HTML representation, (D) OTSL representation. This example demonstrates many of", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 9, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 134.8, "r_y0": 178.3, "r_x1": 480.6, "r_y1": 178.3, "r_x2": 480.6, "r_y2": 170.2, "r_x3": 134.8, "r_y3": 170.2, "coord_origin": "TOPLEFT" }, "text": "the key-features of OTSL, namely its reduced vocabulary size (12 versus 5 in this case),", "orig": "the key-features of OTSL, namely its reduced vocabulary size (12 versus 5 in this case),", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 10, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 134.8, "r_y0": 189.3, "r_x1": 480.6, "r_y1": 189.3, "r_x2": 480.6, "r_y2": 181.2, "r_x3": 134.8, "r_y3": 181.2, "coord_origin": "TOPLEFT" }, "text": "its reduced sequence length (55 versus 30) and a enhanced internal structure (variable", "orig": "its reduced sequence length (55 versus 30) and a enhanced internal structure (variable", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 11, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 134.8, "r_y0": 200.2, "r_x1": 460.9, "r_y1": 200.2, "r_x2": 460.9, "r_y2": 192.2, "r_x3": 134.8, "r_y3": 192.2, "coord_origin": "TOPLEFT" }, "text": "token sequence length per row in HTML versus a fixed length of rows in OTSL).", "orig": "token sequence length per row in HTML versus a fixed length of rows in OTSL).", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 1, "label": "picture", "bbox": { "l": 148.5, "t": 208.4, "r": 464.4, "b": 425.8, "coord_origin": "TOPLEFT" }, "confidence": 0.97, "cells": [ { "index": 12, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 396.4, "r_y0": 289.5, "r_x1": 403.0, "r_y1": 289.5, "r_x2": 403.0, "r_y2": 281.0, "r_x3": 396.4, "r_y3": 281.0, "coord_origin": "TOPLEFT" }, "text": "C", "orig": "C", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 13, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 418.6, "r_y0": 289.4, "r_x1": 425.1, "r_y1": 289.4, "r_x2": 425.1, "r_y2": 280.9, "r_x3": 418.6, "r_y3": 280.9, "coord_origin": "TOPLEFT" }, "text": "C", "orig": "C", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 14, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 395.7, "r_y0": 311.8, "r_x1": 402.3, "r_y1": 311.8, "r_x2": 402.3, "r_y2": 303.2, "r_x3": 395.7, "r_y3": 303.2, "coord_origin": "TOPLEFT" }, "text": "C", "orig": "C", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 15, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 407.5, "r_y0": 311.9, "r_x1": 414.1, "r_y1": 311.9, "r_x2": 414.1, "r_y2": 303.4, "r_x3": 407.5, "r_y3": 303.4, "coord_origin": "TOPLEFT" }, "text": "C", "orig": "C", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 16, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 407.6, "r_y0": 322.9, "r_x1": 414.1, "r_y1": 322.9, "r_x2": 414.1, "r_y2": 314.4, "r_x3": 407.6, "r_y3": 314.4, "coord_origin": "TOPLEFT" }, "text": "C", "orig": "C", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 17, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 418.5, "r_y0": 300.6, "r_x1": 425.1, "r_y1": 300.6, "r_x2": 425.1, "r_y2": 292.1, "r_x3": 418.5, "r_y3": 292.1, "coord_origin": "TOPLEFT" }, "text": "C", "orig": "C", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 18, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 429.6, "r_y0": 300.6, "r_x1": 436.2, "r_y1": 300.6, "r_x2": 436.2, "r_y2": 292.1, "r_x3": 429.6, "r_y3": 292.1, "coord_origin": "TOPLEFT" }, "text": "C", "orig": "C", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 19, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 440.7, "r_y0": 300.5, "r_x1": 447.2, "r_y1": 300.5, "r_x2": 447.2, "r_y2": 292.0, "r_x3": 440.7, "r_y3": 292.0, "coord_origin": "TOPLEFT" }, "text": "C", "orig": "C", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 20, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 418.6, "r_y0": 311.8, "r_x1": 425.2, "r_y1": 311.8, "r_x2": 425.2, "r_y2": 303.3, "r_x3": 418.6, "r_y3": 303.3, "coord_origin": "TOPLEFT" }, "text": "C", "orig": "C", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 21, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 429.7, "r_y0": 311.8, "r_x1": 436.3, "r_y1": 311.8, "r_x2": 436.3, "r_y2": 303.3, "r_x3": 429.7, "r_y3": 303.3, "coord_origin": "TOPLEFT" }, "text": "C", "orig": "C", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 22, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 440.8, "r_y0": 311.7, "r_x1": 447.4, "r_y1": 311.7, "r_x2": 447.4, "r_y2": 303.2, "r_x3": 440.8, "r_y3": 303.2, "coord_origin": "TOPLEFT" }, "text": "C", "orig": "C", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 23, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 418.6, "r_y0": 323.1, "r_x1": 425.2, "r_y1": 323.1, "r_x2": 425.2, "r_y2": 314.6, "r_x3": 418.6, "r_y3": 314.6, "coord_origin": "TOPLEFT" }, "text": "C", "orig": "C", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 24, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 429.7, "r_y0": 323.1, "r_x1": 436.3, "r_y1": 323.1, "r_x2": 436.3, "r_y2": 314.6, "r_x3": 429.7, "r_y3": 314.6, "coord_origin": "TOPLEFT" }, "text": "C", "orig": "C", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 25, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 440.8, "r_y0": 323.0, "r_x1": 447.4, "r_y1": 323.0, "r_x2": 447.4, "r_y2": 314.5, "r_x3": 440.8, "r_y3": 314.5, "coord_origin": "TOPLEFT" }, "text": "C", "orig": "C", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 26, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 407.4, "r_y0": 333.8, "r_x1": 414.0, "r_y1": 333.8, "r_x2": 414.0, "r_y2": 325.3, "r_x3": 407.4, "r_y3": 325.3, "coord_origin": "TOPLEFT" }, "text": "C", "orig": "C", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 27, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 418.5, "r_y0": 334.0, "r_x1": 425.0, "r_y1": 334.0, "r_x2": 425.0, "r_y2": 325.5, "r_x3": 418.5, "r_y3": 325.5, "coord_origin": "TOPLEFT" }, "text": "C", "orig": "C", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 28, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 429.5, "r_y0": 334.0, "r_x1": 436.1, "r_y1": 334.0, "r_x2": 436.1, "r_y2": 325.5, "r_x3": 429.5, "r_y3": 325.5, "coord_origin": "TOPLEFT" }, "text": "C", "orig": "C", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 29, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 440.6, "r_y0": 333.9, "r_x1": 447.2, "r_y1": 333.9, "r_x2": 447.2, "r_y2": 325.4, "r_x3": 440.6, "r_y3": 325.4, "coord_origin": "TOPLEFT" }, "text": "C", "orig": "C", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 30, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 451.9, "r_y0": 288.7, "r_x1": 463.5, "r_y1": 288.7, "r_x2": 463.5, "r_y2": 280.2, "r_x3": 451.9, "r_y3": 280.2, "coord_origin": "TOPLEFT" }, "text": "NL", "orig": "NL", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 31, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 452.2, "r_y0": 300.1, "r_x1": 463.8, "r_y1": 300.1, "r_x2": 463.8, "r_y2": 291.6, "r_x3": 452.2, "r_y3": 291.6, "coord_origin": "TOPLEFT" }, "text": "NL", "orig": "NL", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 32, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 452.2, "r_y0": 311.4, "r_x1": 463.8, "r_y1": 311.4, "r_x2": 463.8, "r_y2": 302.8, "r_x3": 452.2, "r_y3": 302.8, "coord_origin": "TOPLEFT" }, "text": "NL", "orig": "NL", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 33, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 452.1, "r_y0": 322.6, "r_x1": 463.7, "r_y1": 322.6, "r_x2": 463.7, "r_y2": 314.1, "r_x3": 452.1, "r_y3": 314.1, "coord_origin": "TOPLEFT" }, "text": "NL", "orig": "NL", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 34, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 452.3, "r_y0": 334.0, "r_x1": 463.9, "r_y1": 334.0, "r_x2": 463.9, "r_y2": 325.5, "r_x3": 452.3, "r_y3": 325.5, "coord_origin": "TOPLEFT" }, "text": "NL", "orig": "NL", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 35, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 396.1, "r_y0": 323.0, "r_x1": 402.7, "r_y1": 323.0, "r_x2": 402.7, "r_y2": 314.5, "r_x3": 396.1, "r_y3": 314.5, "coord_origin": "TOPLEFT" }, "text": "U", "orig": "U", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 36, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 396.0, "r_y0": 333.9, "r_x1": 402.6, "r_y1": 333.9, "r_x2": 402.6, "r_y2": 325.4, "r_x3": 396.0, "r_y3": 325.4, "coord_origin": "TOPLEFT" }, "text": "U", "orig": "U", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 37, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 396.3, "r_y0": 300.8, "r_x1": 402.8, "r_y1": 300.8, "r_x2": 402.8, "r_y2": 292.3, "r_x3": 396.3, "r_y3": 292.3, "coord_origin": "TOPLEFT" }, "text": "U", "orig": "U", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 38, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 408.5, "r_y0": 289.5, "r_x1": 413.6, "r_y1": 289.5, "r_x2": 413.6, "r_y2": 281.0, "r_x3": 408.5, "r_y3": 281.0, "coord_origin": "TOPLEFT" }, "text": "L", "orig": "L", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 39, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 430.6, "r_y0": 289.0, "r_x1": 435.6, "r_y1": 289.0, "r_x2": 435.6, "r_y2": 280.5, "r_x3": 430.6, "r_y3": 280.5, "coord_origin": "TOPLEFT" }, "text": "L", "orig": "L", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 40, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 441.1, "r_y0": 288.9, "r_x1": 446.1, "r_y1": 288.9, "r_x2": 446.1, "r_y2": 280.4, "r_x3": 441.1, "r_y3": 280.4, "coord_origin": "TOPLEFT" }, "text": "L", "orig": "L", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 41, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 408.0, "r_y0": 300.7, "r_x1": 414.0, "r_y1": 300.7, "r_x2": 414.0, "r_y2": 292.1, "r_x3": 408.0, "r_y3": 292.1, "coord_origin": "TOPLEFT" }, "text": "X", "orig": "X", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 42, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 441.3, "r_y0": 419.7, "r_x1": 452.9, "r_y1": 419.7, "r_x2": 452.9, "r_y2": 411.2, "r_x3": 441.3, "r_y3": 411.2, "coord_origin": "TOPLEFT" }, "text": "NL", "orig": "NL", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 43, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 393.8, "r_y0": 406.9, "r_x1": 432.5, "r_y1": 406.9, "r_x2": 432.5, "r_y2": 399.8, "r_x3": 393.8, "r_y3": 399.8, "coord_origin": "TOPLEFT" }, "text": "vocabulary:", "orig": "vocabulary:", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 44, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 434.6, "r_y0": 406.9, "r_x1": 438.8, "r_y1": 406.9, "r_x2": 438.8, "r_y2": 399.8, "r_x3": 434.6, "r_y3": 399.8, "coord_origin": "TOPLEFT" }, "text": "5", "orig": "5", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 45, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 440.9, "r_y0": 406.9, "r_x1": 463.2, "r_y1": 406.9, "r_x2": 463.2, "r_y2": 399.8, "r_x3": 440.9, "r_y3": 399.8, "coord_origin": "TOPLEFT" }, "text": "tokens", "orig": "tokens", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 46, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 384.1, "r_y0": 265.7, "r_x1": 414.0, "r_y1": 265.7, "r_x2": 414.0, "r_y2": 258.5, "r_x3": 384.1, "r_y3": 258.5, "coord_origin": "TOPLEFT" }, "text": "D OTSL", "orig": "D OTSL", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 47, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 393.8, "r_y0": 273.8, "r_x1": 451.5, "r_y1": 273.8, "r_x2": 451.5, "r_y2": 266.7, "r_x3": 393.8, "r_y3": 266.7, "coord_origin": "TOPLEFT" }, "text": "sequence length:", "orig": "sequence length:", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 48, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 453.6, "r_y0": 273.8, "r_x1": 462.0, "r_y1": 273.8, "r_x2": 462.0, "r_y2": 266.7, "r_x3": 453.6, "r_y3": 266.7, "coord_origin": "TOPLEFT" }, "text": "30", "orig": "30", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 49, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 151.8, "r_y0": 406.9, "r_x1": 233.9, "r_y1": 406.9, "r_x2": 233.9, "r_y2": 399.8, "r_x3": 151.8, "r_y3": 399.8, "coord_origin": "TOPLEFT" }, "text": "vocabulary for this table:", "orig": "vocabulary for this table:", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 50, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 236.0, "r_y0": 406.9, "r_x1": 244.4, "r_y1": 406.9, "r_x2": 244.4, "r_y2": 399.8, "r_x3": 236.0, "r_y3": 399.8, "coord_origin": "TOPLEFT" }, "text": "12", "orig": "12", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 51, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 246.5, "r_y0": 406.9, "r_x1": 268.8, "r_y1": 406.9, "r_x2": 268.8, "r_y2": 399.8, "r_x3": 246.5, "r_y3": 399.8, "coord_origin": "TOPLEFT" }, "text": "tokens", "orig": "tokens", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 52, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 154.3, "r_y0": 220.7, "r_x1": 159.8, "r_y1": 220.7, "r_x2": 159.8, "r_y2": 213.6, "r_x3": 154.3, "r_y3": 213.6, "coord_origin": "TOPLEFT" }, "text": "A", "orig": "A", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 53, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 321.1, "r_y0": 220.7, "r_x1": 326.5, "r_y1": 220.7, "r_x2": 326.5, "r_y2": 213.6, "r_x3": 321.1, "r_y3": 213.6, "coord_origin": "TOPLEFT" }, "text": "B", "orig": "B", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 54, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 153.1, "r_y0": 286.7, "r_x1": 175.8, "r_y1": 286.7, "r_x2": 175.8, "r_y2": 280.3, "r_x3": 153.1, "r_y3": 280.3, "coord_origin": "TOPLEFT" }, "text": "", "orig": "
", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 55, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 160.7, "r_y0": 293.5, "r_x1": 172.8, "r_y1": 293.5, "r_x2": 172.8, "r_y2": 287.1, "r_x3": 160.7, "r_y3": 287.1, "coord_origin": "TOPLEFT" }, "text": "", "orig": "", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 56, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 168.2, "r_y0": 300.3, "r_x1": 177.9, "r_y1": 300.3, "r_x2": 177.9, "r_y2": 293.9, "r_x3": 168.2, "r_y3": 293.9, "coord_origin": "TOPLEFT" }, "text": "", "orig": ">", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 60, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 263.4, "r_y0": 300.3, "r_x1": 278.9, "r_y1": 300.3, "r_x2": 278.9, "r_y2": 293.9, "r_x3": 263.4, "r_y3": 293.9, "coord_origin": "TOPLEFT" }, "text": "", "orig": "", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 61, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 280.8, "r_y0": 300.3, "r_x1": 290.5, "r_y1": 300.3, "r_x2": 290.5, "r_y2": 293.9, "r_x3": 280.8, "r_y3": 293.9, "coord_origin": "TOPLEFT" }, "text": "", "orig": ">", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 64, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 335.9, "r_y0": 300.3, "r_x1": 351.5, "r_y1": 300.3, "r_x2": 351.5, "r_y2": 293.9, "r_x3": 335.9, "r_y3": 293.9, "coord_origin": "TOPLEFT" }, "text": "", "orig": "", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 65, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 160.7, "r_y0": 307.1, "r_x1": 174.7, "r_y1": 307.1, "r_x2": 174.7, "r_y2": 300.8, "r_x3": 160.7, "r_y3": 300.8, "coord_origin": "TOPLEFT" }, "text": "", "orig": "", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 66, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 160.7, "r_y0": 314.0, "r_x1": 172.8, "r_y1": 314.0, "r_x2": 172.8, "r_y2": 307.6, "r_x3": 160.7, "r_y3": 307.6, "coord_origin": "TOPLEFT" }, "text": "", "orig": "", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 67, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 168.2, "r_y0": 320.8, "r_x1": 181.9, "r_y1": 320.8, "r_x2": 181.9, "r_y2": 314.4, "r_x3": 168.2, "r_y3": 314.4, "coord_origin": "TOPLEFT" }, "text": "", "orig": "", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 69, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 201.2, "r_y0": 320.8, "r_x1": 214.9, "r_y1": 320.8, "r_x2": 214.9, "r_y2": 314.4, "r_x3": 201.2, "r_y3": 314.4, "coord_origin": "TOPLEFT" }, "text": "", "orig": "", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 71, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 234.2, "r_y0": 320.8, "r_x1": 247.8, "r_y1": 320.8, "r_x2": 247.8, "r_y2": 314.4, "r_x3": 234.2, "r_y3": 314.4, "coord_origin": "TOPLEFT" }, "text": "", "orig": "", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 73, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 160.7, "r_y0": 327.6, "r_x1": 174.7, "r_y1": 327.6, "r_x2": 174.7, "r_y2": 321.2, "r_x3": 160.7, "r_y3": 321.2, "coord_origin": "TOPLEFT" }, "text": "", "orig": "", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 74, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 160.7, "r_y0": 334.4, "r_x1": 172.8, "r_y1": 334.4, "r_x2": 172.8, "r_y2": 328.0, "r_x3": 160.7, "r_y3": 328.0, "coord_origin": "TOPLEFT" }, "text": "", "orig": "", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 75, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 168.2, "r_y0": 341.2, "r_x1": 373.1, "r_y1": 341.2, "r_x2": 373.1, "r_y2": 334.8, "r_x3": 168.2, "r_y3": 334.8, "coord_origin": "TOPLEFT" }, "text": "", "orig": "", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 76, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 160.7, "r_y0": 348.0, "r_x1": 174.7, "r_y1": 348.0, "r_x2": 174.7, "r_y2": 341.7, "r_x3": 160.7, "r_y3": 341.7, "coord_origin": "TOPLEFT" }, "text": "", "orig": "", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 77, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 160.7, "r_y0": 354.9, "r_x1": 172.8, "r_y1": 354.9, "r_x2": 172.8, "r_y2": 348.5, "r_x3": 160.7, "r_y3": 348.5, "coord_origin": "TOPLEFT" }, "text": "", "orig": "", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 78, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 168.2, "r_y0": 361.7, "r_x1": 181.9, "r_y1": 361.7, "r_x2": 181.9, "r_y2": 355.3, "r_x3": 168.2, "r_y3": 355.3, "coord_origin": "TOPLEFT" }, "text": "", "orig": "", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 80, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 201.2, "r_y0": 361.7, "r_x1": 214.9, "r_y1": 361.7, "r_x2": 214.9, "r_y2": 355.3, "r_x3": 201.2, "r_y3": 355.3, "coord_origin": "TOPLEFT" }, "text": "", "orig": "", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 82, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 234.2, "r_y0": 361.7, "r_x1": 247.8, "r_y1": 361.7, "r_x2": 247.8, "r_y2": 355.3, "r_x3": 234.2, "r_y3": 355.3, "coord_origin": "TOPLEFT" }, "text": "", "orig": "", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 84, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 267.2, "r_y0": 361.7, "r_x1": 280.8, "r_y1": 361.7, "r_x2": 280.8, "r_y2": 355.3, "r_x3": 267.2, "r_y3": 355.3, "coord_origin": "TOPLEFT" }, "text": "", "orig": "", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 86, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 160.7, "r_y0": 368.5, "r_x1": 174.7, "r_y1": 368.5, "r_x2": 174.7, "r_y2": 362.1, "r_x3": 160.7, "r_y3": 362.1, "coord_origin": "TOPLEFT" }, "text": "", "orig": "", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 87, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 160.7, "r_y0": 375.3, "r_x1": 172.8, "r_y1": 375.3, "r_x2": 172.8, "r_y2": 368.9, "r_x3": 160.7, "r_y3": 368.9, "coord_origin": "TOPLEFT" }, "text": "", "orig": "", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 88, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 168.2, "r_y0": 382.1, "r_x1": 181.9, "r_y1": 382.1, "r_x2": 181.9, "r_y2": 375.7, "r_x3": 168.2, "r_y3": 375.7, "coord_origin": "TOPLEFT" }, "text": "", "orig": "", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 90, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 201.2, "r_y0": 382.1, "r_x1": 214.9, "r_y1": 382.1, "r_x2": 214.9, "r_y2": 375.7, "r_x3": 201.2, "r_y3": 375.7, "coord_origin": "TOPLEFT" }, "text": "", "orig": "", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 92, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 234.2, "r_y0": 382.1, "r_x1": 247.8, "r_y1": 382.1, "r_x2": 247.8, "r_y2": 375.7, "r_x3": 234.2, "r_y3": 375.7, "coord_origin": "TOPLEFT" }, "text": "", "orig": "", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 94, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 267.2, "r_y0": 382.1, "r_x1": 280.8, "r_y1": 382.1, "r_x2": 280.8, "r_y2": 375.7, "r_x3": 267.2, "r_y3": 375.7, "coord_origin": "TOPLEFT" }, "text": "", "orig": "", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 96, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 160.7, "r_y0": 388.9, "r_x1": 174.7, "r_y1": 388.9, "r_x2": 174.7, "r_y2": 382.6, "r_x3": 160.7, "r_y3": 382.6, "coord_origin": "TOPLEFT" }, "text": "", "orig": "", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 97, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 153.1, "r_y0": 395.8, "r_x1": 177.7, "r_y1": 395.8, "r_x2": 177.7, "r_y2": 389.4, "r_x3": 153.1, "r_y3": 389.4, "coord_origin": "TOPLEFT" }, "text": "
", "orig": "", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 68, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 183.8, "r_y0": 320.8, "r_x1": 199.3, "r_y1": 320.8, "r_x2": 199.3, "r_y2": 314.4, "r_x3": 183.8, "r_y3": 314.4, "coord_origin": "TOPLEFT" }, "text": "", "orig": "", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 70, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 216.8, "r_y0": 320.8, "r_x1": 232.3, "r_y1": 320.8, "r_x2": 232.3, "r_y2": 314.4, "r_x3": 216.8, "r_y3": 314.4, "coord_origin": "TOPLEFT" }, "text": "", "orig": "", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 72, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 249.7, "r_y0": 320.8, "r_x1": 265.3, "r_y1": 320.8, "r_x2": 265.3, "r_y2": 314.4, "r_x3": 249.7, "r_y3": 314.4, "coord_origin": "TOPLEFT" }, "text": "
", "orig": "", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 79, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 183.8, "r_y0": 361.7, "r_x1": 199.3, "r_y1": 361.7, "r_x2": 199.3, "r_y2": 355.3, "r_x3": 183.8, "r_y3": 355.3, "coord_origin": "TOPLEFT" }, "text": "", "orig": "", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 81, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 216.8, "r_y0": 361.7, "r_x1": 232.3, "r_y1": 361.7, "r_x2": 232.3, "r_y2": 355.3, "r_x3": 216.8, "r_y3": 355.3, "coord_origin": "TOPLEFT" }, "text": "", "orig": "", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 83, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 249.7, "r_y0": 361.7, "r_x1": 265.3, "r_y1": 361.7, "r_x2": 265.3, "r_y2": 355.3, "r_x3": 249.7, "r_y3": 355.3, "coord_origin": "TOPLEFT" }, "text": "", "orig": "", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 85, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 282.7, "r_y0": 361.7, "r_x1": 298.2, "r_y1": 361.7, "r_x2": 298.2, "r_y2": 355.3, "r_x3": 282.7, "r_y3": 355.3, "coord_origin": "TOPLEFT" }, "text": "
", "orig": "", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 89, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 183.8, "r_y0": 382.1, "r_x1": 199.3, "r_y1": 382.1, "r_x2": 199.3, "r_y2": 375.7, "r_x3": 183.8, "r_y3": 375.7, "coord_origin": "TOPLEFT" }, "text": "", "orig": "", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 91, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 216.8, "r_y0": 382.1, "r_x1": 232.3, "r_y1": 382.1, "r_x2": 232.3, "r_y2": 375.7, "r_x3": 216.8, "r_y3": 375.7, "coord_origin": "TOPLEFT" }, "text": "", "orig": "", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 93, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 249.7, "r_y0": 382.1, "r_x1": 265.3, "r_y1": 382.1, "r_x2": 265.3, "r_y2": 375.7, "r_x3": 249.7, "r_y3": 375.7, "coord_origin": "TOPLEFT" }, "text": "", "orig": "", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 95, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 282.7, "r_y0": 382.1, "r_x1": 298.2, "r_y1": 382.1, "r_x2": 298.2, "r_y2": 375.7, "r_x3": 282.7, "r_y3": 375.7, "coord_origin": "TOPLEFT" }, "text": "
", "orig": "", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 98, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 395.1, "r_y0": 419.9, "r_x1": 401.6, "r_y1": 419.9, "r_x2": 401.6, "r_y2": 411.3, "r_x3": 395.1, "r_y3": 411.3, "coord_origin": "TOPLEFT" }, "text": "C", "orig": "C", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 99, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 407.4, "r_y0": 419.9, "r_x1": 412.5, "r_y1": 419.9, "r_x2": 412.5, "r_y2": 411.3, "r_x3": 407.4, "r_y3": 411.3, "coord_origin": "TOPLEFT" }, "text": "L", "orig": "L", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 100, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 418.7, "r_y0": 419.9, "r_x1": 425.3, "r_y1": 419.9, "r_x2": 425.3, "r_y2": 411.3, "r_x3": 418.7, "r_y3": 411.3, "coord_origin": "TOPLEFT" }, "text": "U", "orig": "U", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 101, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 430.5, "r_y0": 419.9, "r_x1": 436.6, "r_y1": 419.9, "r_x2": 436.6, "r_y2": 411.3, "r_x3": 430.5, "r_y3": 411.3, "coord_origin": "TOPLEFT" }, "text": "X", "orig": "X", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 102, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 152.4, "r_y0": 416.2, "r_x1": 175.1, "r_y1": 416.2, "r_x2": 175.1, "r_y2": 409.8, "r_x3": 152.4, "r_y3": 409.8, "coord_origin": "TOPLEFT" }, "text": "", "orig": "
", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 103, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 178.9, "r_y0": 416.2, "r_x1": 191.0, "r_y1": 416.2, "r_x2": 191.0, "r_y2": 409.8, "r_x3": 178.9, "r_y3": 409.8, "coord_origin": "TOPLEFT" }, "text": "", "orig": "", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 104, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 194.8, "r_y0": 416.2, "r_x1": 208.8, "r_y1": 416.2, "r_x2": 208.8, "r_y2": 409.8, "r_x3": 194.8, "r_y3": 409.8, "coord_origin": "TOPLEFT" }, "text": "", "orig": "", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 105, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 212.6, "r_y0": 416.2, "r_x1": 226.3, "r_y1": 416.2, "r_x2": 226.3, "r_y2": 409.8, "r_x3": 212.6, "r_y3": 409.8, "coord_origin": "TOPLEFT" }, "text": "", "orig": "", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 107, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 249.4, "r_y0": 416.2, "r_x1": 259.0, "r_y1": 416.2, "r_x2": 259.0, "r_y2": 409.8, "r_x3": 249.4, "r_y3": 409.8, "coord_origin": "TOPLEFT" }, "text": "", "orig": ">", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 113, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 244.5, "r_y0": 424.5, "r_x1": 269.1, "r_y1": 424.5, "r_x2": 269.1, "r_y2": 418.1, "r_x3": 244.5, "r_y3": 418.1, "coord_origin": "TOPLEFT" }, "text": "
", "orig": "", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 106, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 230.0, "r_y0": 416.2, "r_x1": 245.6, "r_y1": 416.2, "r_x2": 245.6, "r_y2": 409.8, "r_x3": 230.0, "r_y3": 409.8, "coord_origin": "TOPLEFT" }, "text": "
", "orig": "", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 114, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 154.5, "r_y0": 265.7, "r_x1": 159.6, "r_y1": 265.7, "r_x2": 159.6, "r_y2": 258.6, "r_x3": 154.5, "r_y3": 258.6, "coord_origin": "TOPLEFT" }, "text": "C", "orig": "C", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 115, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 164.7, "r_y0": 265.7, "r_x1": 185.2, "r_y1": 265.7, "r_x2": 185.2, "r_y2": 258.6, "r_x3": 164.7, "r_y3": 258.6, "coord_origin": "TOPLEFT" }, "text": "HTML", "orig": "HTML", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 116, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 164.4, "r_y0": 273.6, "r_x1": 222.1, "r_y1": 273.6, "r_x2": 222.1, "r_y2": 266.5, "r_x3": 164.4, "r_y3": 266.5, "coord_origin": "TOPLEFT" }, "text": "sequence length:", "orig": "sequence length:", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 117, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 224.2, "r_y0": 273.6, "r_x1": 232.6, "r_y1": 273.6, "r_x2": 232.6, "r_y2": 266.5, "r_x3": 224.2, "r_y3": 266.5, "coord_origin": "TOPLEFT" }, "text": "55", "orig": "55", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [ { "id": 11, "label": "text", "bbox": { "l": 396.4, "t": 281.0, "r": 403.0, "b": 289.5, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 12, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 396.4, "r_y0": 289.5, "r_x1": 403.0, "r_y1": 289.5, "r_x2": 403.0, "r_y2": 281.0, "r_x3": 396.4, "r_y3": 281.0, "coord_origin": "TOPLEFT" }, "text": "C", "orig": "C", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 12, "label": "text", "bbox": { "l": 418.6, "t": 280.9, "r": 425.1, "b": 289.4, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 13, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 418.6, "r_y0": 289.4, "r_x1": 425.1, "r_y1": 289.4, "r_x2": 425.1, "r_y2": 280.9, "r_x3": 418.6, "r_y3": 280.9, "coord_origin": "TOPLEFT" }, "text": "C", "orig": "C", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 13, "label": "text", "bbox": { "l": 395.7, "t": 303.2, "r": 402.3, "b": 311.8, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 14, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 395.7, "r_y0": 311.8, "r_x1": 402.3, "r_y1": 311.8, "r_x2": 402.3, "r_y2": 303.2, "r_x3": 395.7, "r_y3": 303.2, "coord_origin": "TOPLEFT" }, "text": "C", "orig": "C", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 14, "label": "text", "bbox": { "l": 407.5, "t": 303.4, "r": 414.1, "b": 311.9, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 15, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 407.5, "r_y0": 311.9, "r_x1": 414.1, "r_y1": 311.9, "r_x2": 414.1, "r_y2": 303.4, "r_x3": 407.5, "r_y3": 303.4, "coord_origin": "TOPLEFT" }, "text": "C", "orig": "C", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 15, "label": "text", "bbox": { "l": 407.6, "t": 314.4, "r": 414.1, "b": 322.9, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 16, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 407.6, "r_y0": 322.9, "r_x1": 414.1, "r_y1": 322.9, "r_x2": 414.1, "r_y2": 314.4, "r_x3": 407.6, "r_y3": 314.4, "coord_origin": "TOPLEFT" }, "text": "C", "orig": "C", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 16, "label": "text", "bbox": { "l": 418.5, "t": 292.1, "r": 425.1, "b": 300.6, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 17, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 418.5, "r_y0": 300.6, "r_x1": 425.1, "r_y1": 300.6, "r_x2": 425.1, "r_y2": 292.1, "r_x3": 418.5, "r_y3": 292.1, "coord_origin": "TOPLEFT" }, "text": "C", "orig": "C", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 17, "label": "text", "bbox": { "l": 429.6, "t": 292.1, "r": 436.2, "b": 300.6, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 18, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 429.6, "r_y0": 300.6, "r_x1": 436.2, "r_y1": 300.6, "r_x2": 436.2, "r_y2": 292.1, "r_x3": 429.6, "r_y3": 292.1, "coord_origin": "TOPLEFT" }, "text": "C", "orig": "C", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 18, "label": "text", "bbox": { "l": 440.7, "t": 292.0, "r": 447.2, "b": 300.5, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 19, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 440.7, "r_y0": 300.5, "r_x1": 447.2, "r_y1": 300.5, "r_x2": 447.2, "r_y2": 292.0, "r_x3": 440.7, "r_y3": 292.0, "coord_origin": "TOPLEFT" }, "text": "C", "orig": "C", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 19, "label": "text", "bbox": { "l": 418.6, "t": 303.3, "r": 425.2, "b": 311.8, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 20, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 418.6, "r_y0": 311.8, "r_x1": 425.2, "r_y1": 311.8, "r_x2": 425.2, "r_y2": 303.3, "r_x3": 418.6, "r_y3": 303.3, "coord_origin": "TOPLEFT" }, "text": "C", "orig": "C", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 20, "label": "text", "bbox": { "l": 429.7, "t": 303.3, "r": 436.3, "b": 311.8, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 21, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 429.7, "r_y0": 311.8, "r_x1": 436.3, "r_y1": 311.8, "r_x2": 436.3, "r_y2": 303.3, "r_x3": 429.7, "r_y3": 303.3, "coord_origin": "TOPLEFT" }, "text": "C", "orig": "C", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 21, "label": "text", "bbox": { "l": 440.8, "t": 303.2, "r": 447.4, "b": 311.7, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 22, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 440.8, "r_y0": 311.7, "r_x1": 447.4, "r_y1": 311.7, "r_x2": 447.4, "r_y2": 303.2, "r_x3": 440.8, "r_y3": 303.2, "coord_origin": "TOPLEFT" }, "text": "C", "orig": "C", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 22, "label": "text", "bbox": { "l": 418.6, "t": 314.6, "r": 425.2, "b": 323.1, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 23, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 418.6, "r_y0": 323.1, "r_x1": 425.2, "r_y1": 323.1, "r_x2": 425.2, "r_y2": 314.6, "r_x3": 418.6, "r_y3": 314.6, "coord_origin": "TOPLEFT" }, "text": "C", "orig": "C", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 23, "label": "text", "bbox": { "l": 429.7, "t": 314.6, "r": 436.3, "b": 323.1, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 24, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 429.7, "r_y0": 323.1, "r_x1": 436.3, "r_y1": 323.1, "r_x2": 436.3, "r_y2": 314.6, "r_x3": 429.7, "r_y3": 314.6, "coord_origin": "TOPLEFT" }, "text": "C", "orig": "C", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 24, "label": "text", "bbox": { "l": 440.8, "t": 314.5, "r": 447.4, "b": 323.0, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 25, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 440.8, "r_y0": 323.0, "r_x1": 447.4, "r_y1": 323.0, "r_x2": 447.4, "r_y2": 314.5, "r_x3": 440.8, "r_y3": 314.5, "coord_origin": "TOPLEFT" }, "text": "C", "orig": "C", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 25, "label": "text", "bbox": { "l": 407.4, "t": 325.3, "r": 414.0, "b": 333.8, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 26, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 407.4, "r_y0": 333.8, "r_x1": 414.0, "r_y1": 333.8, "r_x2": 414.0, "r_y2": 325.3, "r_x3": 407.4, "r_y3": 325.3, "coord_origin": "TOPLEFT" }, "text": "C", "orig": "C", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 26, "label": "text", "bbox": { "l": 418.5, "t": 325.5, "r": 425.0, "b": 334.0, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 27, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 418.5, "r_y0": 334.0, "r_x1": 425.0, "r_y1": 334.0, "r_x2": 425.0, "r_y2": 325.5, "r_x3": 418.5, "r_y3": 325.5, "coord_origin": "TOPLEFT" }, "text": "C", "orig": "C", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 27, "label": "text", "bbox": { "l": 429.5, "t": 325.5, "r": 436.1, "b": 334.0, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 28, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 429.5, "r_y0": 334.0, "r_x1": 436.1, "r_y1": 334.0, "r_x2": 436.1, "r_y2": 325.5, "r_x3": 429.5, "r_y3": 325.5, "coord_origin": "TOPLEFT" }, "text": "C", "orig": "C", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 28, "label": "text", "bbox": { "l": 440.6, "t": 325.4, "r": 447.2, "b": 333.9, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 29, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 440.6, "r_y0": 333.9, "r_x1": 447.2, "r_y1": 333.9, "r_x2": 447.2, "r_y2": 325.4, "r_x3": 440.6, "r_y3": 325.4, "coord_origin": "TOPLEFT" }, "text": "C", "orig": "C", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 29, "label": "text", "bbox": { "l": 451.9, "t": 280.2, "r": 463.5, "b": 288.7, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 30, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 451.9, "r_y0": 288.7, "r_x1": 463.5, "r_y1": 288.7, "r_x2": 463.5, "r_y2": 280.2, "r_x3": 451.9, "r_y3": 280.2, "coord_origin": "TOPLEFT" }, "text": "NL", "orig": "NL", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 30, "label": "text", "bbox": { "l": 452.2, "t": 291.6, "r": 463.8, "b": 300.1, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 31, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 452.2, "r_y0": 300.1, "r_x1": 463.8, "r_y1": 300.1, "r_x2": 463.8, "r_y2": 291.6, "r_x3": 452.2, "r_y3": 291.6, "coord_origin": "TOPLEFT" }, "text": "NL", "orig": "NL", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 31, "label": "text", "bbox": { "l": 452.2, "t": 302.8, "r": 463.8, "b": 311.4, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 32, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 452.2, "r_y0": 311.4, "r_x1": 463.8, "r_y1": 311.4, "r_x2": 463.8, "r_y2": 302.8, "r_x3": 452.2, "r_y3": 302.8, "coord_origin": "TOPLEFT" }, "text": "NL", "orig": "NL", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 32, "label": "text", "bbox": { "l": 452.1, "t": 314.1, "r": 463.7, "b": 322.6, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 33, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 452.1, "r_y0": 322.6, "r_x1": 463.7, "r_y1": 322.6, "r_x2": 463.7, "r_y2": 314.1, "r_x3": 452.1, "r_y3": 314.1, "coord_origin": "TOPLEFT" }, "text": "NL", "orig": "NL", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 33, "label": "text", "bbox": { "l": 452.3, "t": 325.5, "r": 463.9, "b": 334.0, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 34, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 452.3, "r_y0": 334.0, "r_x1": 463.9, "r_y1": 334.0, "r_x2": 463.9, "r_y2": 325.5, "r_x3": 452.3, "r_y3": 325.5, "coord_origin": "TOPLEFT" }, "text": "NL", "orig": "NL", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 34, "label": "text", "bbox": { "l": 396.1, "t": 314.5, "r": 402.7, "b": 323.0, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 35, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 396.1, "r_y0": 323.0, "r_x1": 402.7, "r_y1": 323.0, "r_x2": 402.7, "r_y2": 314.5, "r_x3": 396.1, "r_y3": 314.5, "coord_origin": "TOPLEFT" }, "text": "U", "orig": "U", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 35, "label": "text", "bbox": { "l": 396.0, "t": 325.4, "r": 402.6, "b": 333.9, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 36, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 396.0, "r_y0": 333.9, "r_x1": 402.6, "r_y1": 333.9, "r_x2": 402.6, "r_y2": 325.4, "r_x3": 396.0, "r_y3": 325.4, "coord_origin": "TOPLEFT" }, "text": "U", "orig": "U", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 36, "label": "text", "bbox": { "l": 396.3, "t": 292.3, "r": 402.8, "b": 300.8, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 37, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 396.3, "r_y0": 300.8, "r_x1": 402.8, "r_y1": 300.8, "r_x2": 402.8, "r_y2": 292.3, "r_x3": 396.3, "r_y3": 292.3, "coord_origin": "TOPLEFT" }, "text": "U", "orig": "U", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 37, "label": "text", "bbox": { "l": 408.5, "t": 281.0, "r": 413.6, "b": 289.5, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 38, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 408.5, "r_y0": 289.5, "r_x1": 413.6, "r_y1": 289.5, "r_x2": 413.6, "r_y2": 281.0, "r_x3": 408.5, "r_y3": 281.0, "coord_origin": "TOPLEFT" }, "text": "L", "orig": "L", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 38, "label": "text", "bbox": { "l": 430.6, "t": 280.5, "r": 435.6, "b": 289.0, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 39, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 430.6, "r_y0": 289.0, "r_x1": 435.6, "r_y1": 289.0, "r_x2": 435.6, "r_y2": 280.5, "r_x3": 430.6, "r_y3": 280.5, "coord_origin": "TOPLEFT" }, "text": "L", "orig": "L", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 39, "label": "text", "bbox": { "l": 441.1, "t": 280.4, "r": 446.1, "b": 288.9, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 40, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 441.1, "r_y0": 288.9, "r_x1": 446.1, "r_y1": 288.9, "r_x2": 446.1, "r_y2": 280.4, "r_x3": 441.1, "r_y3": 280.4, "coord_origin": "TOPLEFT" }, "text": "L", "orig": "L", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 40, "label": "text", "bbox": { "l": 408.0, "t": 292.1, "r": 414.0, "b": 300.7, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 41, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 408.0, "r_y0": 300.7, "r_x1": 414.0, "r_y1": 300.7, "r_x2": 414.0, "r_y2": 292.1, "r_x3": 408.0, "r_y3": 292.1, "coord_origin": "TOPLEFT" }, "text": "X", "orig": "X", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 41, "label": "text", "bbox": { "l": 441.3, "t": 411.2, "r": 452.9, "b": 419.7, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 42, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 441.3, "r_y0": 419.7, "r_x1": 452.9, "r_y1": 419.7, "r_x2": 452.9, "r_y2": 411.2, "r_x3": 441.3, "r_y3": 411.2, "coord_origin": "TOPLEFT" }, "text": "NL", "orig": "NL", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 42, "label": "text", "bbox": { "l": 393.8, "t": 399.8, "r": 432.5, "b": 406.9, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 43, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 393.8, "r_y0": 406.9, "r_x1": 432.5, "r_y1": 406.9, "r_x2": 432.5, "r_y2": 399.8, "r_x3": 393.8, "r_y3": 399.8, "coord_origin": "TOPLEFT" }, "text": "vocabulary:", "orig": "vocabulary:", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 43, "label": "text", "bbox": { "l": 434.6, "t": 399.8, "r": 438.8, "b": 406.9, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 44, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 434.6, "r_y0": 406.9, "r_x1": 438.8, "r_y1": 406.9, "r_x2": 438.8, "r_y2": 399.8, "r_x3": 434.6, "r_y3": 399.8, "coord_origin": "TOPLEFT" }, "text": "5", "orig": "5", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 44, "label": "text", "bbox": { "l": 440.9, "t": 399.8, "r": 463.2, "b": 406.9, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 45, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 440.9, "r_y0": 406.9, "r_x1": 463.2, "r_y1": 406.9, "r_x2": 463.2, "r_y2": 399.8, "r_x3": 440.9, "r_y3": 399.8, "coord_origin": "TOPLEFT" }, "text": "tokens", "orig": "tokens", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 45, "label": "text", "bbox": { "l": 384.1, "t": 258.5, "r": 414.0, "b": 265.7, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 46, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 384.1, "r_y0": 265.7, "r_x1": 414.0, "r_y1": 265.7, "r_x2": 414.0, "r_y2": 258.5, "r_x3": 384.1, "r_y3": 258.5, "coord_origin": "TOPLEFT" }, "text": "D OTSL", "orig": "D OTSL", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 46, "label": "text", "bbox": { "l": 393.8, "t": 266.7, "r": 451.5, "b": 273.8, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 47, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 393.8, "r_y0": 273.8, "r_x1": 451.5, "r_y1": 273.8, "r_x2": 451.5, "r_y2": 266.7, "r_x3": 393.8, "r_y3": 266.7, "coord_origin": "TOPLEFT" }, "text": "sequence length:", "orig": "sequence length:", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 47, "label": "text", "bbox": { "l": 453.6, "t": 266.7, "r": 462.0, "b": 273.8, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 48, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 453.6, "r_y0": 273.8, "r_x1": 462.0, "r_y1": 273.8, "r_x2": 462.0, "r_y2": 266.7, "r_x3": 453.6, "r_y3": 266.7, "coord_origin": "TOPLEFT" }, "text": "30", "orig": "30", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 48, "label": "text", "bbox": { "l": 151.8, "t": 399.8, "r": 233.9, "b": 406.9, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 49, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 151.8, "r_y0": 406.9, "r_x1": 233.9, "r_y1": 406.9, "r_x2": 233.9, "r_y2": 399.8, "r_x3": 151.8, "r_y3": 399.8, "coord_origin": "TOPLEFT" }, "text": "vocabulary for this table:", "orig": "vocabulary for this table:", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 49, "label": "text", "bbox": { "l": 236.0, "t": 399.8, "r": 244.4, "b": 406.9, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 50, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 236.0, "r_y0": 406.9, "r_x1": 244.4, "r_y1": 406.9, "r_x2": 244.4, "r_y2": 399.8, "r_x3": 236.0, "r_y3": 399.8, "coord_origin": "TOPLEFT" }, "text": "12", "orig": "12", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 50, "label": "text", "bbox": { "l": 246.5, "t": 399.8, "r": 268.8, "b": 406.9, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 51, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 246.5, "r_y0": 406.9, "r_x1": 268.8, "r_y1": 406.9, "r_x2": 268.8, "r_y2": 399.8, "r_x3": 246.5, "r_y3": 399.8, "coord_origin": "TOPLEFT" }, "text": "tokens", "orig": "tokens", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 51, "label": "text", "bbox": { "l": 154.3, "t": 213.6, "r": 159.8, "b": 220.7, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 52, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 154.3, "r_y0": 220.7, "r_x1": 159.8, "r_y1": 220.7, "r_x2": 159.8, "r_y2": 213.6, "r_x3": 154.3, "r_y3": 213.6, "coord_origin": "TOPLEFT" }, "text": "A", "orig": "A", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 52, "label": "text", "bbox": { "l": 321.1, "t": 213.6, "r": 326.5, "b": 220.7, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 53, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 321.1, "r_y0": 220.7, "r_x1": 326.5, "r_y1": 220.7, "r_x2": 326.5, "r_y2": 213.6, "r_x3": 321.1, "r_y3": 213.6, "coord_origin": "TOPLEFT" }, "text": "B", "orig": "B", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 53, "label": "text", "bbox": { "l": 153.1, "t": 280.3, "r": 175.8, "b": 286.7, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 54, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 153.1, "r_y0": 286.7, "r_x1": 175.8, "r_y1": 286.7, "r_x2": 175.8, "r_y2": 280.3, "r_x3": 153.1, "r_y3": 280.3, "coord_origin": "TOPLEFT" }, "text": "", "orig": "
", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 54, "label": "text", "bbox": { "l": 160.7, "t": 287.1, "r": 172.8, "b": 293.5, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 55, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 160.7, "r_y0": 293.5, "r_x1": 172.8, "r_y1": 293.5, "r_x2": 172.8, "r_y2": 287.1, "r_x3": 160.7, "r_y3": 287.1, "coord_origin": "TOPLEFT" }, "text": "", "orig": "", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 55, "label": "text", "bbox": { "l": 168.2, "t": 293.9, "r": 177.9, "b": 300.3, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 56, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 168.2, "r_y0": 300.3, "r_x1": 177.9, "r_y1": 300.3, "r_x2": 177.9, "r_y2": 293.9, "r_x3": 168.2, "r_y3": 293.9, "coord_origin": "TOPLEFT" }, "text": "", "orig": ">", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 59, "label": "text", "bbox": { "l": 263.4, "t": 293.9, "r": 278.9, "b": 300.3, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 60, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 263.4, "r_y0": 300.3, "r_x1": 278.9, "r_y1": 300.3, "r_x2": 278.9, "r_y2": 293.9, "r_x3": 263.4, "r_y3": 293.9, "coord_origin": "TOPLEFT" }, "text": "", "orig": "", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 60, "label": "text", "bbox": { "l": 280.8, "t": 293.9, "r": 290.5, "b": 300.3, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 61, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 280.8, "r_y0": 300.3, "r_x1": 290.5, "r_y1": 300.3, "r_x2": 290.5, "r_y2": 293.9, "r_x3": 280.8, "r_y3": 293.9, "coord_origin": "TOPLEFT" }, "text": "", "orig": ">", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 63, "label": "text", "bbox": { "l": 335.9, "t": 293.9, "r": 351.5, "b": 300.3, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 64, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 335.9, "r_y0": 300.3, "r_x1": 351.5, "r_y1": 300.3, "r_x2": 351.5, "r_y2": 293.9, "r_x3": 335.9, "r_y3": 293.9, "coord_origin": "TOPLEFT" }, "text": "", "orig": "", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 64, "label": "text", "bbox": { "l": 160.7, "t": 300.8, "r": 174.7, "b": 307.1, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 65, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 160.7, "r_y0": 307.1, "r_x1": 174.7, "r_y1": 307.1, "r_x2": 174.7, "r_y2": 300.8, "r_x3": 160.7, "r_y3": 300.8, "coord_origin": "TOPLEFT" }, "text": "", "orig": "", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 65, "label": "text", "bbox": { "l": 160.7, "t": 307.6, "r": 172.8, "b": 314.0, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 66, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 160.7, "r_y0": 314.0, "r_x1": 172.8, "r_y1": 314.0, "r_x2": 172.8, "r_y2": 307.6, "r_x3": 160.7, "r_y3": 307.6, "coord_origin": "TOPLEFT" }, "text": "", "orig": "", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 66, "label": "text", "bbox": { "l": 168.2, "t": 314.4, "r": 181.9, "b": 320.8, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 67, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 168.2, "r_y0": 320.8, "r_x1": 181.9, "r_y1": 320.8, "r_x2": 181.9, "r_y2": 314.4, "r_x3": 168.2, "r_y3": 314.4, "coord_origin": "TOPLEFT" }, "text": "", "orig": "", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 68, "label": "text", "bbox": { "l": 201.2, "t": 314.4, "r": 214.9, "b": 320.8, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 69, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 201.2, "r_y0": 320.8, "r_x1": 214.9, "r_y1": 320.8, "r_x2": 214.9, "r_y2": 314.4, "r_x3": 201.2, "r_y3": 314.4, "coord_origin": "TOPLEFT" }, "text": "", "orig": "", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 70, "label": "text", "bbox": { "l": 234.2, "t": 314.4, "r": 247.8, "b": 320.8, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 71, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 234.2, "r_y0": 320.8, "r_x1": 247.8, "r_y1": 320.8, "r_x2": 247.8, "r_y2": 314.4, "r_x3": 234.2, "r_y3": 314.4, "coord_origin": "TOPLEFT" }, "text": "", "orig": "", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 72, "label": "text", "bbox": { "l": 160.7, "t": 321.2, "r": 174.7, "b": 327.6, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 73, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 160.7, "r_y0": 327.6, "r_x1": 174.7, "r_y1": 327.6, "r_x2": 174.7, "r_y2": 321.2, "r_x3": 160.7, "r_y3": 321.2, "coord_origin": "TOPLEFT" }, "text": "", "orig": "", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 73, "label": "text", "bbox": { "l": 160.7, "t": 328.0, "r": 172.8, "b": 334.4, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 74, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 160.7, "r_y0": 334.4, "r_x1": 172.8, "r_y1": 334.4, "r_x2": 172.8, "r_y2": 328.0, "r_x3": 160.7, "r_y3": 328.0, "coord_origin": "TOPLEFT" }, "text": "", "orig": "", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 74, "label": "text", "bbox": { "l": 168.2, "t": 334.8, "r": 373.1, "b": 341.2, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 75, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 168.2, "r_y0": 341.2, "r_x1": 373.1, "r_y1": 341.2, "r_x2": 373.1, "r_y2": 334.8, "r_x3": 168.2, "r_y3": 334.8, "coord_origin": "TOPLEFT" }, "text": "", "orig": "", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 75, "label": "text", "bbox": { "l": 160.7, "t": 341.7, "r": 174.7, "b": 348.0, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 76, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 160.7, "r_y0": 348.0, "r_x1": 174.7, "r_y1": 348.0, "r_x2": 174.7, "r_y2": 341.7, "r_x3": 160.7, "r_y3": 341.7, "coord_origin": "TOPLEFT" }, "text": "", "orig": "", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 76, "label": "text", "bbox": { "l": 160.7, "t": 348.5, "r": 172.8, "b": 354.9, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 77, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 160.7, "r_y0": 354.9, "r_x1": 172.8, "r_y1": 354.9, "r_x2": 172.8, "r_y2": 348.5, "r_x3": 160.7, "r_y3": 348.5, "coord_origin": "TOPLEFT" }, "text": "", "orig": "", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 77, "label": "text", "bbox": { "l": 168.2, "t": 355.3, "r": 181.9, "b": 361.7, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 78, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 168.2, "r_y0": 361.7, "r_x1": 181.9, "r_y1": 361.7, "r_x2": 181.9, "r_y2": 355.3, "r_x3": 168.2, "r_y3": 355.3, "coord_origin": "TOPLEFT" }, "text": "", "orig": "", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 79, "label": "text", "bbox": { "l": 201.2, "t": 355.3, "r": 214.9, "b": 361.7, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 80, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 201.2, "r_y0": 361.7, "r_x1": 214.9, "r_y1": 361.7, "r_x2": 214.9, "r_y2": 355.3, "r_x3": 201.2, "r_y3": 355.3, "coord_origin": "TOPLEFT" }, "text": "", "orig": "", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 81, "label": "text", "bbox": { "l": 234.2, "t": 355.3, "r": 247.8, "b": 361.7, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 82, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 234.2, "r_y0": 361.7, "r_x1": 247.8, "r_y1": 361.7, "r_x2": 247.8, "r_y2": 355.3, "r_x3": 234.2, "r_y3": 355.3, "coord_origin": "TOPLEFT" }, "text": "", "orig": "", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 83, "label": "text", "bbox": { "l": 267.2, "t": 355.3, "r": 280.8, "b": 361.7, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 84, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 267.2, "r_y0": 361.7, "r_x1": 280.8, "r_y1": 361.7, "r_x2": 280.8, "r_y2": 355.3, "r_x3": 267.2, "r_y3": 355.3, "coord_origin": "TOPLEFT" }, "text": "", "orig": "", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 85, "label": "text", "bbox": { "l": 160.7, "t": 362.1, "r": 174.7, "b": 368.5, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 86, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 160.7, "r_y0": 368.5, "r_x1": 174.7, "r_y1": 368.5, "r_x2": 174.7, "r_y2": 362.1, "r_x3": 160.7, "r_y3": 362.1, "coord_origin": "TOPLEFT" }, "text": "", "orig": "", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 86, "label": "text", "bbox": { "l": 160.7, "t": 368.9, "r": 172.8, "b": 375.3, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 87, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 160.7, "r_y0": 375.3, "r_x1": 172.8, "r_y1": 375.3, "r_x2": 172.8, "r_y2": 368.9, "r_x3": 160.7, "r_y3": 368.9, "coord_origin": "TOPLEFT" }, "text": "", "orig": "", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 87, "label": "text", "bbox": { "l": 168.2, "t": 375.7, "r": 181.9, "b": 382.1, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 88, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 168.2, "r_y0": 382.1, "r_x1": 181.9, "r_y1": 382.1, "r_x2": 181.9, "r_y2": 375.7, "r_x3": 168.2, "r_y3": 375.7, "coord_origin": "TOPLEFT" }, "text": "", "orig": "", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 89, "label": "text", "bbox": { "l": 201.2, "t": 375.7, "r": 214.9, "b": 382.1, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 90, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 201.2, "r_y0": 382.1, "r_x1": 214.9, "r_y1": 382.1, "r_x2": 214.9, "r_y2": 375.7, "r_x3": 201.2, "r_y3": 375.7, "coord_origin": "TOPLEFT" }, "text": "", "orig": "", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 91, "label": "text", "bbox": { "l": 234.2, "t": 375.7, "r": 247.8, "b": 382.1, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 92, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 234.2, "r_y0": 382.1, "r_x1": 247.8, "r_y1": 382.1, "r_x2": 247.8, "r_y2": 375.7, "r_x3": 234.2, "r_y3": 375.7, "coord_origin": "TOPLEFT" }, "text": "", "orig": "", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 93, "label": "text", "bbox": { "l": 267.2, "t": 375.7, "r": 280.8, "b": 382.1, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 94, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 267.2, "r_y0": 382.1, "r_x1": 280.8, "r_y1": 382.1, "r_x2": 280.8, "r_y2": 375.7, "r_x3": 267.2, "r_y3": 375.7, "coord_origin": "TOPLEFT" }, "text": "", "orig": "", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 95, "label": "text", "bbox": { "l": 160.7, "t": 382.6, "r": 174.7, "b": 388.9, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 96, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 160.7, "r_y0": 388.9, "r_x1": 174.7, "r_y1": 388.9, "r_x2": 174.7, "r_y2": 382.6, "r_x3": 160.7, "r_y3": 382.6, "coord_origin": "TOPLEFT" }, "text": "", "orig": "", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 96, "label": "text", "bbox": { "l": 153.1, "t": 389.4, "r": 177.7, "b": 395.8, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 97, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 153.1, "r_y0": 395.8, "r_x1": 177.7, "r_y1": 395.8, "r_x2": 177.7, "r_y2": 389.4, "r_x3": 153.1, "r_y3": 389.4, "coord_origin": "TOPLEFT" }, "text": "
", "orig": "", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 67, "label": "text", "bbox": { "l": 183.8, "t": 314.4, "r": 199.3, "b": 320.8, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 68, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 183.8, "r_y0": 320.8, "r_x1": 199.3, "r_y1": 320.8, "r_x2": 199.3, "r_y2": 314.4, "r_x3": 183.8, "r_y3": 314.4, "coord_origin": "TOPLEFT" }, "text": "", "orig": "", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 69, "label": "text", "bbox": { "l": 216.8, "t": 314.4, "r": 232.3, "b": 320.8, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 70, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 216.8, "r_y0": 320.8, "r_x1": 232.3, "r_y1": 320.8, "r_x2": 232.3, "r_y2": 314.4, "r_x3": 216.8, "r_y3": 314.4, "coord_origin": "TOPLEFT" }, "text": "", "orig": "", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 71, "label": "text", "bbox": { "l": 249.7, "t": 314.4, "r": 265.3, "b": 320.8, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 72, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 249.7, "r_y0": 320.8, "r_x1": 265.3, "r_y1": 320.8, "r_x2": 265.3, "r_y2": 314.4, "r_x3": 249.7, "r_y3": 314.4, "coord_origin": "TOPLEFT" }, "text": "
", "orig": "", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 78, "label": "text", "bbox": { "l": 183.8, "t": 355.3, "r": 199.3, "b": 361.7, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 79, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 183.8, "r_y0": 361.7, "r_x1": 199.3, "r_y1": 361.7, "r_x2": 199.3, "r_y2": 355.3, "r_x3": 183.8, "r_y3": 355.3, "coord_origin": "TOPLEFT" }, "text": "", "orig": "", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 80, "label": "text", "bbox": { "l": 216.8, "t": 355.3, "r": 232.3, "b": 361.7, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 81, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 216.8, "r_y0": 361.7, "r_x1": 232.3, "r_y1": 361.7, "r_x2": 232.3, "r_y2": 355.3, "r_x3": 216.8, "r_y3": 355.3, "coord_origin": "TOPLEFT" }, "text": "", "orig": "", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 82, "label": "text", "bbox": { "l": 249.7, "t": 355.3, "r": 265.3, "b": 361.7, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 83, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 249.7, "r_y0": 361.7, "r_x1": 265.3, "r_y1": 361.7, "r_x2": 265.3, "r_y2": 355.3, "r_x3": 249.7, "r_y3": 355.3, "coord_origin": "TOPLEFT" }, "text": "", "orig": "", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 84, "label": "text", "bbox": { "l": 282.7, "t": 355.3, "r": 298.2, "b": 361.7, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 85, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 282.7, "r_y0": 361.7, "r_x1": 298.2, "r_y1": 361.7, "r_x2": 298.2, "r_y2": 355.3, "r_x3": 282.7, "r_y3": 355.3, "coord_origin": "TOPLEFT" }, "text": "
", "orig": "", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 88, "label": "text", "bbox": { "l": 183.8, "t": 375.7, "r": 199.3, "b": 382.1, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 89, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 183.8, "r_y0": 382.1, "r_x1": 199.3, "r_y1": 382.1, "r_x2": 199.3, "r_y2": 375.7, "r_x3": 183.8, "r_y3": 375.7, "coord_origin": "TOPLEFT" }, "text": "", "orig": "", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 90, "label": "text", "bbox": { "l": 216.8, "t": 375.7, "r": 232.3, "b": 382.1, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 91, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 216.8, "r_y0": 382.1, "r_x1": 232.3, "r_y1": 382.1, "r_x2": 232.3, "r_y2": 375.7, "r_x3": 216.8, "r_y3": 375.7, "coord_origin": "TOPLEFT" }, "text": "", "orig": "", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 92, "label": "text", "bbox": { "l": 249.7, "t": 375.7, "r": 265.3, "b": 382.1, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 93, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 249.7, "r_y0": 382.1, "r_x1": 265.3, "r_y1": 382.1, "r_x2": 265.3, "r_y2": 375.7, "r_x3": 249.7, "r_y3": 375.7, "coord_origin": "TOPLEFT" }, "text": "", "orig": "", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 94, "label": "text", "bbox": { "l": 282.7, "t": 375.7, "r": 298.2, "b": 382.1, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 95, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 282.7, "r_y0": 382.1, "r_x1": 298.2, "r_y1": 382.1, "r_x2": 298.2, "r_y2": 375.7, "r_x3": 282.7, "r_y3": 375.7, "coord_origin": "TOPLEFT" }, "text": "
", "orig": "", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 97, "label": "text", "bbox": { "l": 395.1, "t": 411.3, "r": 401.6, "b": 419.9, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 98, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 395.1, "r_y0": 419.9, "r_x1": 401.6, "r_y1": 419.9, "r_x2": 401.6, "r_y2": 411.3, "r_x3": 395.1, "r_y3": 411.3, "coord_origin": "TOPLEFT" }, "text": "C", "orig": "C", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 98, "label": "text", "bbox": { "l": 407.4, "t": 411.3, "r": 412.5, "b": 419.9, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 99, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 407.4, "r_y0": 419.9, "r_x1": 412.5, "r_y1": 419.9, "r_x2": 412.5, "r_y2": 411.3, "r_x3": 407.4, "r_y3": 411.3, "coord_origin": "TOPLEFT" }, "text": "L", "orig": "L", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 99, "label": "text", "bbox": { "l": 418.7, "t": 411.3, "r": 425.3, "b": 419.9, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 100, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 418.7, "r_y0": 419.9, "r_x1": 425.3, "r_y1": 419.9, "r_x2": 425.3, "r_y2": 411.3, "r_x3": 418.7, "r_y3": 411.3, "coord_origin": "TOPLEFT" }, "text": "U", "orig": "U", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 100, "label": "text", "bbox": { "l": 430.5, "t": 411.3, "r": 436.6, "b": 419.9, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 101, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 430.5, "r_y0": 419.9, "r_x1": 436.6, "r_y1": 419.9, "r_x2": 436.6, "r_y2": 411.3, "r_x3": 430.5, "r_y3": 411.3, "coord_origin": "TOPLEFT" }, "text": "X", "orig": "X", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 101, "label": "text", "bbox": { "l": 152.4, "t": 409.8, "r": 175.1, "b": 416.2, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 102, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 152.4, "r_y0": 416.2, "r_x1": 175.1, "r_y1": 416.2, "r_x2": 175.1, "r_y2": 409.8, "r_x3": 152.4, "r_y3": 409.8, "coord_origin": "TOPLEFT" }, "text": "", "orig": "
", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 102, "label": "text", "bbox": { "l": 178.9, "t": 409.8, "r": 191.0, "b": 416.2, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 103, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 178.9, "r_y0": 416.2, "r_x1": 191.0, "r_y1": 416.2, "r_x2": 191.0, "r_y2": 409.8, "r_x3": 178.9, "r_y3": 409.8, "coord_origin": "TOPLEFT" }, "text": "", "orig": "", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 103, "label": "text", "bbox": { "l": 194.8, "t": 409.8, "r": 208.8, "b": 416.2, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 104, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 194.8, "r_y0": 416.2, "r_x1": 208.8, "r_y1": 416.2, "r_x2": 208.8, "r_y2": 409.8, "r_x3": 194.8, "r_y3": 409.8, "coord_origin": "TOPLEFT" }, "text": "", "orig": "", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 104, "label": "text", "bbox": { "l": 212.6, "t": 409.8, "r": 226.3, "b": 416.2, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 105, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 212.6, "r_y0": 416.2, "r_x1": 226.3, "r_y1": 416.2, "r_x2": 226.3, "r_y2": 409.8, "r_x3": 212.6, "r_y3": 409.8, "coord_origin": "TOPLEFT" }, "text": "", "orig": "", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 106, "label": "text", "bbox": { "l": 249.4, "t": 409.8, "r": 259.0, "b": 416.2, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 107, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 249.4, "r_y0": 416.2, "r_x1": 259.0, "r_y1": 416.2, "r_x2": 259.0, "r_y2": 409.8, "r_x3": 249.4, "r_y3": 409.8, "coord_origin": "TOPLEFT" }, "text": "", "orig": ">", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 112, "label": "text", "bbox": { "l": 244.5, "t": 418.1, "r": 269.1, "b": 424.5, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 113, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 244.5, "r_y0": 424.5, "r_x1": 269.1, "r_y1": 424.5, "r_x2": 269.1, "r_y2": 418.1, "r_x3": 244.5, "r_y3": 418.1, "coord_origin": "TOPLEFT" }, "text": "
", "orig": "", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 105, "label": "text", "bbox": { "l": 230.0, "t": 409.8, "r": 245.6, "b": 416.2, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 106, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 230.0, "r_y0": 416.2, "r_x1": 245.6, "r_y1": 416.2, "r_x2": 245.6, "r_y2": 409.8, "r_x3": 230.0, "r_y3": 409.8, "coord_origin": "TOPLEFT" }, "text": "
", "orig": "", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 113, "label": "text", "bbox": { "l": 154.5, "t": 258.6, "r": 159.6, "b": 265.7, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 114, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 154.5, "r_y0": 265.7, "r_x1": 159.6, "r_y1": 265.7, "r_x2": 159.6, "r_y2": 258.6, "r_x3": 154.5, "r_y3": 258.6, "coord_origin": "TOPLEFT" }, "text": "C", "orig": "C", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 114, "label": "text", "bbox": { "l": 164.7, "t": 258.6, "r": 185.2, "b": 265.7, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 115, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 164.7, "r_y0": 265.7, "r_x1": 185.2, "r_y1": 265.7, "r_x2": 185.2, "r_y2": 258.6, "r_x3": 164.7, "r_y3": 258.6, "coord_origin": "TOPLEFT" }, "text": "HTML", "orig": "HTML", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 115, "label": "text", "bbox": { "l": 164.4, "t": 266.5, "r": 222.1, "b": 273.6, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 116, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 164.4, "r_y0": 273.6, "r_x1": 222.1, "r_y1": 273.6, "r_x2": 222.1, "r_y2": 266.5, "r_x3": 164.4, "r_y3": 266.5, "coord_origin": "TOPLEFT" }, "text": "sequence length:", "orig": "sequence length:", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 116, "label": "text", "bbox": { "l": 224.2, "t": 266.5, "r": 232.6, "b": 273.6, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 117, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 224.2, "r_y0": 273.6, "r_x1": 232.6, "r_y1": 273.6, "r_x2": 232.6, "r_y2": 266.5, "r_x3": 224.2, "r_y3": 266.5, "coord_origin": "TOPLEFT" }, "text": "55", "orig": "55", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] } ] }, { "id": 2, "label": "text", "bbox": { "l": 134.8, "t": 452.3, "r": 480.6, "b": 520.9, "coord_origin": "TOPLEFT" }, "confidence": 0.95, "cells": [ { "index": 118, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 134.8, "r_y0": 461.1, "r_x1": 161.3, "r_y1": 461.1, "r_x2": 161.3, "r_y2": 452.3, "r_x3": 134.8, "r_y3": 452.3, "coord_origin": "TOPLEFT" }, "text": "today,", "orig": "today,", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 119, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 164.3, "r_y0": 461.1, "r_x1": 226.3, "r_y1": 461.1, "r_x2": 226.3, "r_y2": 452.3, "r_x3": 164.3, "r_y3": 452.3, "coord_origin": "TOPLEFT" }, "text": "table detection", "orig": "table detection", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 120, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 230.0, "r_y0": 461.1, "r_x1": 480.6, "r_y1": 461.1, "r_x2": 480.6, "r_y2": 452.3, "r_x3": 230.0, "r_y3": 452.3, "coord_origin": "TOPLEFT" }, "text": "in documents is a well understood problem, and the latest", "orig": "in documents is a well understood problem, and the latest", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 121, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 134.8, "r_y0": 473.1, "r_x1": 480.6, "r_y1": 473.1, "r_x2": 480.6, "r_y2": 464.3, "r_x3": 134.8, "r_y3": 464.3, "coord_origin": "TOPLEFT" }, "text": "state-of-the-art (SOTA) object detection methods provide an accuracy compa-", "orig": "state-of-the-art (SOTA) object detection methods provide an accuracy compa-", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 122, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 134.8, "r_y0": 485.0, "r_x1": 480.6, "r_y1": 485.0, "r_x2": 480.6, "r_y2": 476.2, "r_x3": 134.8, "r_y3": 476.2, "coord_origin": "TOPLEFT" }, "text": "rable to human observers [7,8,10,14,23]. On the other hand, the problem of table", "orig": "rable to human observers [7,8,10,14,23]. On the other hand, the problem of table", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 123, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 134.8, "r_y0": 497.0, "r_x1": 480.6, "r_y1": 497.0, "r_x2": 480.6, "r_y2": 488.2, "r_x3": 134.8, "r_y3": 488.2, "coord_origin": "TOPLEFT" }, "text": "structure recognition (TSR) is a lot more challenging and remains a very active", "orig": "structure recognition (TSR) is a lot more challenging and remains a very active", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 124, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 134.8, "r_y0": 508.9, "r_x1": 480.6, "r_y1": 508.9, "r_x2": 480.6, "r_y2": 500.1, "r_x3": 134.8, "r_y3": 500.1, "coord_origin": "TOPLEFT" }, "text": "area of research, in which many novel machine learning algorithms are being", "orig": "area of research, in which many novel machine learning algorithms are being", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 125, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 134.8, "r_y0": 520.9, "r_x1": 313.2, "r_y1": 520.9, "r_x2": 313.2, "r_y2": 512.1, "r_x3": 134.8, "r_y3": 512.1, "coord_origin": "TOPLEFT" }, "text": "explored [3,4,5,9,11,12,13,14,17,18,21,22].", "orig": "explored [3,4,5,9,11,12,13,14,17,18,21,22].", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 0, "label": "text", "bbox": { "l": 134.8, "t": 524.6, "r": 480.6, "b": 664.9, "coord_origin": "TOPLEFT" }, "confidence": 0.98, "cells": [ { "index": 126, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 149.7, "r_y0": 533.3, "r_x1": 480.6, "r_y1": 533.3, "r_x2": 480.6, "r_y2": 524.6, "r_x3": 149.7, "r_y3": 524.6, "coord_origin": "TOPLEFT" }, "text": "Recently emerging SOTA methods for table structure recognition employ", "orig": "Recently emerging SOTA methods for table structure recognition employ", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 127, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 134.8, "r_y0": 545.3, "r_x1": 480.6, "r_y1": 545.3, "r_x2": 480.6, "r_y2": 536.5, "r_x3": 134.8, "r_y3": 536.5, "coord_origin": "TOPLEFT" }, "text": "transformer-based models, in which an image of the table is provided to the net-", "orig": "transformer-based models, in which an image of the table is provided to the net-", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 128, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 134.8, "r_y0": 557.3, "r_x1": 480.6, "r_y1": 557.3, "r_x2": 480.6, "r_y2": 548.5, "r_x3": 134.8, "r_y3": 548.5, "coord_origin": "TOPLEFT" }, "text": "work in order to predict the structure of the table as a sequence of tokens. These", "orig": "work in order to predict the structure of the table as a sequence of tokens. These", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 129, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 134.8, "r_y0": 569.2, "r_x1": 480.6, "r_y1": 569.2, "r_x2": 480.6, "r_y2": 560.4, "r_x3": 134.8, "r_y3": 560.4, "coord_origin": "TOPLEFT" }, "text": "image-to-sequence (Im2Seq) models are extremely powerful, since they allow for", "orig": "image-to-sequence (Im2Seq) models are extremely powerful, since they allow for", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 130, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 134.8, "r_y0": 581.2, "r_x1": 480.6, "r_y1": 581.2, "r_x2": 480.6, "r_y2": 572.4, "r_x3": 134.8, "r_y3": 572.4, "coord_origin": "TOPLEFT" }, "text": "a purely data-driven solution. The tokens of the sequence typically belong to a", "orig": "a purely data-driven solution. The tokens of the sequence typically belong to a", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 131, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 134.8, "r_y0": 593.1, "r_x1": 480.6, "r_y1": 593.1, "r_x2": 480.6, "r_y2": 584.3, "r_x3": 134.8, "r_y3": 584.3, "coord_origin": "TOPLEFT" }, "text": "markup language such as HTML, Latex or Markdown, which allow to describe", "orig": "markup language such as HTML, Latex or Markdown, which allow to describe", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 132, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 134.8, "r_y0": 605.1, "r_x1": 480.6, "r_y1": 605.1, "r_x2": 480.6, "r_y2": 596.3, "r_x3": 134.8, "r_y3": 596.3, "coord_origin": "TOPLEFT" }, "text": "table structure as rows, columns and spanning cells in various configurations.", "orig": "table structure as rows, columns and spanning cells in various configurations.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 133, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 134.8, "r_y0": 617.0, "r_x1": 480.6, "r_y1": 617.0, "r_x2": 480.6, "r_y2": 608.2, "r_x3": 134.8, "r_y3": 608.2, "coord_origin": "TOPLEFT" }, "text": "In Figure 1, we illustrate how HTML is used to represent the table-structure", "orig": "In Figure 1, we illustrate how HTML is used to represent the table-structure", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 134, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 134.8, "r_y0": 629.0, "r_x1": 480.6, "r_y1": 629.0, "r_x2": 480.6, "r_y2": 620.2, "r_x3": 134.8, "r_y3": 620.2, "coord_origin": "TOPLEFT" }, "text": "of a particular example table. Public table-structure data sets such as PubTab-", "orig": "of a particular example table. Public table-structure data sets such as PubTab-", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 135, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 134.8, "r_y0": 640.9, "r_x1": 480.6, "r_y1": 640.9, "r_x2": 480.6, "r_y2": 632.1, "r_x3": 134.8, "r_y3": 632.1, "coord_origin": "TOPLEFT" }, "text": "Net [22], and FinTabNet [21], which were created in a semi-automated way from", "orig": "Net [22], and FinTabNet [21], which were created in a semi-automated way from", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 136, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 134.8, "r_y0": 652.9, "r_x1": 480.6, "r_y1": 652.9, "r_x2": 480.6, "r_y2": 644.1, "r_x3": 134.8, "r_y3": 644.1, "coord_origin": "TOPLEFT" }, "text": "paired PDF and HTML sources (e.g. PubMed Central), popularized primarily", "orig": "paired PDF and HTML sources (e.g. PubMed Central), popularized primarily", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 137, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 134.8, "r_y0": 664.9, "r_x1": 421.5, "r_y1": 664.9, "r_x2": 421.5, "r_y2": 656.1, "r_x3": 134.8, "r_y3": 656.1, "coord_origin": "TOPLEFT" }, "text": "the use of HTML as ground-truth representation format for TSR.", "orig": "the use of HTML as ground-truth representation format for TSR.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] } ] }, "tablestructure": { "table_map": {} }, "figures_classification": null, "equations_prediction": null, "vlm_response": null }, "assembled": { "elements": [ { "label": "page_header", "id": 5, "page_no": 1, "cluster": { "id": 5, "label": "page_header", "bbox": { "l": 134.8, "t": 93.8, "r": 139.4, "b": 101.8, "coord_origin": "TOPLEFT" }, "confidence": 0.86, "cells": [ { "index": 0, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 134.8, "r_y0": 101.8, "r_x1": 139.4, "r_y1": 101.8, "r_x2": 139.4, "r_y2": 93.8, "r_x3": 134.8, "r_y3": 93.8, "coord_origin": "TOPLEFT" }, "text": "2", "orig": "2", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, "text": "2" }, { "label": "page_header", "id": 3, "page_no": 1, "cluster": { "id": 3, "label": "page_header", "bbox": { "l": 167.8, "t": 93.8, "r": 231.7, "b": 101.8, "coord_origin": "TOPLEFT" }, "confidence": 0.91, "cells": [ { "index": 1, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 167.8, "r_y0": 101.8, "r_x1": 178.1, "r_y1": 101.8, "r_x2": 178.1, "r_y2": 93.8, "r_x3": 167.8, "r_y3": 93.8, "coord_origin": "TOPLEFT" }, "text": "M.", "orig": "M.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 2, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 182.4, "r_y0": 101.8, "r_x1": 231.7, "r_y1": 101.8, "r_x2": 231.7, "r_y2": 93.8, "r_x3": 182.4, "r_y3": 93.8, "coord_origin": "TOPLEFT" }, "text": "Lysak, et al.", "orig": "Lysak, et al.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, "text": "M. Lysak, et al." }, { "label": "caption", "id": 4, "page_no": 1, "cluster": { "id": 4, "label": "caption", "bbox": { "l": 134.8, "t": 126.3, "r": 480.6, "b": 200.2, "coord_origin": "TOPLEFT" }, "confidence": 0.89, "cells": [ { "index": 3, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 134.8, "r_y0": 134.3, "r_x1": 162.6, "r_y1": 134.3, "r_x2": 162.6, "r_y2": 126.3, "r_x3": 134.8, "r_y3": 126.3, "coord_origin": "TOPLEFT" }, "text": "Fig. 1.", "orig": "Fig. 1.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 4, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 167.1, "r_y0": 134.5, "r_x1": 480.6, "r_y1": 134.5, "r_x2": 480.6, "r_y2": 126.4, "r_x3": 167.1, "r_y3": 126.4, "coord_origin": "TOPLEFT" }, "text": "Comparison between HTML and OTSL table structure representation: (A)", "orig": "Comparison between HTML and OTSL table structure representation: (A)", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 5, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 134.8, "r_y0": 145.4, "r_x1": 480.6, "r_y1": 145.4, "r_x2": 480.6, "r_y2": 137.4, "r_x3": 134.8, "r_y3": 137.4, "coord_origin": "TOPLEFT" }, "text": "table-example with complex row and column headers, including a 2D empty span,", "orig": "table-example with complex row and column headers, including a 2D empty span,", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 6, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 134.8, "r_y0": 156.4, "r_x1": 148.0, "r_y1": 156.4, "r_x2": 148.0, "r_y2": 148.3, "r_x3": 134.8, "r_y3": 148.3, "coord_origin": "TOPLEFT" }, "text": "(B)", "orig": "(B)", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 7, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 152.4, "r_y0": 156.4, "r_x1": 480.6, "r_y1": 156.4, "r_x2": 480.6, "r_y2": 148.3, "r_x3": 152.4, "r_y3": 148.3, "coord_origin": "TOPLEFT" }, "text": "minimal graphical representation of table structure using rectangular layout, (C)", "orig": "minimal graphical representation of table structure using rectangular layout, (C)", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 8, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 134.8, "r_y0": 167.3, "r_x1": 480.6, "r_y1": 167.3, "r_x2": 480.6, "r_y2": 159.3, "r_x3": 134.8, "r_y3": 159.3, "coord_origin": "TOPLEFT" }, "text": "HTML representation, (D) OTSL representation. This example demonstrates many of", "orig": "HTML representation, (D) OTSL representation. This example demonstrates many of", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 9, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 134.8, "r_y0": 178.3, "r_x1": 480.6, "r_y1": 178.3, "r_x2": 480.6, "r_y2": 170.2, "r_x3": 134.8, "r_y3": 170.2, "coord_origin": "TOPLEFT" }, "text": "the key-features of OTSL, namely its reduced vocabulary size (12 versus 5 in this case),", "orig": "the key-features of OTSL, namely its reduced vocabulary size (12 versus 5 in this case),", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 10, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 134.8, "r_y0": 189.3, "r_x1": 480.6, "r_y1": 189.3, "r_x2": 480.6, "r_y2": 181.2, "r_x3": 134.8, "r_y3": 181.2, "coord_origin": "TOPLEFT" }, "text": "its reduced sequence length (55 versus 30) and a enhanced internal structure (variable", "orig": "its reduced sequence length (55 versus 30) and a enhanced internal structure (variable", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 11, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 134.8, "r_y0": 200.2, "r_x1": 460.9, "r_y1": 200.2, "r_x2": 460.9, "r_y2": 192.2, "r_x3": 134.8, "r_y3": 192.2, "coord_origin": "TOPLEFT" }, "text": "token sequence length per row in HTML versus a fixed length of rows in OTSL).", "orig": "token sequence length per row in HTML versus a fixed length of rows in OTSL).", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, "text": "Fig. 1. Comparison between HTML and OTSL table structure representation: (A) table-example with complex row and column headers, including a 2D empty span, (B) minimal graphical representation of table structure using rectangular layout, (C) HTML representation, (D) OTSL representation. This example demonstrates many of the key-features of OTSL, namely its reduced vocabulary size (12 versus 5 in this case), its reduced sequence length (55 versus 30) and a enhanced internal structure (variable token sequence length per row in HTML versus a fixed length of rows in OTSL)." }, { "label": "picture", "id": 1, "page_no": 1, "cluster": { "id": 1, "label": "picture", "bbox": { "l": 148.5, "t": 208.4, "r": 464.4, "b": 425.8, "coord_origin": "TOPLEFT" }, "confidence": 0.97, "cells": [ { "index": 12, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 396.4, "r_y0": 289.5, "r_x1": 403.0, "r_y1": 289.5, "r_x2": 403.0, "r_y2": 281.0, "r_x3": 396.4, "r_y3": 281.0, "coord_origin": "TOPLEFT" }, "text": "C", "orig": "C", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 13, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 418.6, "r_y0": 289.4, "r_x1": 425.1, "r_y1": 289.4, "r_x2": 425.1, "r_y2": 280.9, "r_x3": 418.6, "r_y3": 280.9, "coord_origin": "TOPLEFT" }, "text": "C", "orig": "C", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 14, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 395.7, "r_y0": 311.8, "r_x1": 402.3, "r_y1": 311.8, "r_x2": 402.3, "r_y2": 303.2, "r_x3": 395.7, "r_y3": 303.2, "coord_origin": "TOPLEFT" }, "text": "C", "orig": "C", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 15, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 407.5, "r_y0": 311.9, "r_x1": 414.1, "r_y1": 311.9, "r_x2": 414.1, "r_y2": 303.4, "r_x3": 407.5, "r_y3": 303.4, "coord_origin": "TOPLEFT" }, "text": "C", "orig": "C", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 16, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 407.6, "r_y0": 322.9, "r_x1": 414.1, "r_y1": 322.9, "r_x2": 414.1, "r_y2": 314.4, "r_x3": 407.6, "r_y3": 314.4, "coord_origin": "TOPLEFT" }, "text": "C", "orig": "C", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 17, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 418.5, "r_y0": 300.6, "r_x1": 425.1, "r_y1": 300.6, "r_x2": 425.1, "r_y2": 292.1, "r_x3": 418.5, "r_y3": 292.1, "coord_origin": "TOPLEFT" }, "text": "C", "orig": "C", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 18, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 429.6, "r_y0": 300.6, "r_x1": 436.2, "r_y1": 300.6, "r_x2": 436.2, "r_y2": 292.1, "r_x3": 429.6, "r_y3": 292.1, "coord_origin": "TOPLEFT" }, "text": "C", "orig": "C", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 19, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 440.7, "r_y0": 300.5, "r_x1": 447.2, "r_y1": 300.5, "r_x2": 447.2, "r_y2": 292.0, "r_x3": 440.7, "r_y3": 292.0, "coord_origin": "TOPLEFT" }, "text": "C", "orig": "C", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 20, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 418.6, "r_y0": 311.8, "r_x1": 425.2, "r_y1": 311.8, "r_x2": 425.2, "r_y2": 303.3, "r_x3": 418.6, "r_y3": 303.3, "coord_origin": "TOPLEFT" }, "text": "C", "orig": "C", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 21, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 429.7, "r_y0": 311.8, "r_x1": 436.3, "r_y1": 311.8, "r_x2": 436.3, "r_y2": 303.3, "r_x3": 429.7, "r_y3": 303.3, "coord_origin": "TOPLEFT" }, "text": "C", "orig": "C", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 22, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 440.8, "r_y0": 311.7, "r_x1": 447.4, "r_y1": 311.7, "r_x2": 447.4, "r_y2": 303.2, "r_x3": 440.8, "r_y3": 303.2, "coord_origin": "TOPLEFT" }, "text": "C", "orig": "C", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 23, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 418.6, "r_y0": 323.1, "r_x1": 425.2, "r_y1": 323.1, "r_x2": 425.2, "r_y2": 314.6, "r_x3": 418.6, "r_y3": 314.6, "coord_origin": "TOPLEFT" }, "text": "C", "orig": "C", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 24, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 429.7, "r_y0": 323.1, "r_x1": 436.3, "r_y1": 323.1, "r_x2": 436.3, "r_y2": 314.6, "r_x3": 429.7, "r_y3": 314.6, "coord_origin": "TOPLEFT" }, "text": "C", "orig": "C", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 25, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 440.8, "r_y0": 323.0, "r_x1": 447.4, "r_y1": 323.0, "r_x2": 447.4, "r_y2": 314.5, "r_x3": 440.8, "r_y3": 314.5, "coord_origin": "TOPLEFT" }, "text": "C", "orig": "C", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 26, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 407.4, "r_y0": 333.8, "r_x1": 414.0, "r_y1": 333.8, "r_x2": 414.0, "r_y2": 325.3, "r_x3": 407.4, "r_y3": 325.3, "coord_origin": "TOPLEFT" }, "text": "C", "orig": "C", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 27, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 418.5, "r_y0": 334.0, "r_x1": 425.0, "r_y1": 334.0, "r_x2": 425.0, "r_y2": 325.5, "r_x3": 418.5, "r_y3": 325.5, "coord_origin": "TOPLEFT" }, "text": "C", "orig": "C", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 28, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 429.5, "r_y0": 334.0, "r_x1": 436.1, "r_y1": 334.0, "r_x2": 436.1, "r_y2": 325.5, "r_x3": 429.5, "r_y3": 325.5, "coord_origin": "TOPLEFT" }, "text": "C", "orig": "C", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 29, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 440.6, "r_y0": 333.9, "r_x1": 447.2, "r_y1": 333.9, "r_x2": 447.2, "r_y2": 325.4, "r_x3": 440.6, "r_y3": 325.4, "coord_origin": "TOPLEFT" }, "text": "C", "orig": "C", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 30, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 451.9, "r_y0": 288.7, "r_x1": 463.5, "r_y1": 288.7, "r_x2": 463.5, "r_y2": 280.2, "r_x3": 451.9, "r_y3": 280.2, "coord_origin": "TOPLEFT" }, "text": "NL", "orig": "NL", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 31, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 452.2, "r_y0": 300.1, "r_x1": 463.8, "r_y1": 300.1, "r_x2": 463.8, "r_y2": 291.6, "r_x3": 452.2, "r_y3": 291.6, "coord_origin": "TOPLEFT" }, "text": "NL", "orig": "NL", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 32, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 452.2, "r_y0": 311.4, "r_x1": 463.8, "r_y1": 311.4, "r_x2": 463.8, "r_y2": 302.8, "r_x3": 452.2, "r_y3": 302.8, "coord_origin": "TOPLEFT" }, "text": "NL", "orig": "NL", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 33, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 452.1, "r_y0": 322.6, "r_x1": 463.7, "r_y1": 322.6, "r_x2": 463.7, "r_y2": 314.1, "r_x3": 452.1, "r_y3": 314.1, "coord_origin": "TOPLEFT" }, "text": "NL", "orig": "NL", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 34, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 452.3, "r_y0": 334.0, "r_x1": 463.9, "r_y1": 334.0, "r_x2": 463.9, "r_y2": 325.5, "r_x3": 452.3, "r_y3": 325.5, "coord_origin": "TOPLEFT" }, "text": "NL", "orig": "NL", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 35, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 396.1, "r_y0": 323.0, "r_x1": 402.7, "r_y1": 323.0, "r_x2": 402.7, "r_y2": 314.5, "r_x3": 396.1, "r_y3": 314.5, "coord_origin": "TOPLEFT" }, "text": "U", "orig": "U", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 36, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 396.0, "r_y0": 333.9, "r_x1": 402.6, "r_y1": 333.9, "r_x2": 402.6, "r_y2": 325.4, "r_x3": 396.0, "r_y3": 325.4, "coord_origin": "TOPLEFT" }, "text": "U", "orig": "U", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 37, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 396.3, "r_y0": 300.8, "r_x1": 402.8, "r_y1": 300.8, "r_x2": 402.8, "r_y2": 292.3, "r_x3": 396.3, "r_y3": 292.3, "coord_origin": "TOPLEFT" }, "text": "U", "orig": "U", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 38, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 408.5, "r_y0": 289.5, "r_x1": 413.6, "r_y1": 289.5, "r_x2": 413.6, "r_y2": 281.0, "r_x3": 408.5, "r_y3": 281.0, "coord_origin": "TOPLEFT" }, "text": "L", "orig": "L", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 39, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 430.6, "r_y0": 289.0, "r_x1": 435.6, "r_y1": 289.0, "r_x2": 435.6, "r_y2": 280.5, "r_x3": 430.6, "r_y3": 280.5, "coord_origin": "TOPLEFT" }, "text": "L", "orig": "L", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 40, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 441.1, "r_y0": 288.9, "r_x1": 446.1, "r_y1": 288.9, "r_x2": 446.1, "r_y2": 280.4, "r_x3": 441.1, "r_y3": 280.4, "coord_origin": "TOPLEFT" }, "text": "L", "orig": "L", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 41, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 408.0, "r_y0": 300.7, "r_x1": 414.0, "r_y1": 300.7, "r_x2": 414.0, "r_y2": 292.1, "r_x3": 408.0, "r_y3": 292.1, "coord_origin": "TOPLEFT" }, "text": "X", "orig": "X", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 42, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 441.3, "r_y0": 419.7, "r_x1": 452.9, "r_y1": 419.7, "r_x2": 452.9, "r_y2": 411.2, "r_x3": 441.3, "r_y3": 411.2, "coord_origin": "TOPLEFT" }, "text": "NL", "orig": "NL", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 43, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 393.8, "r_y0": 406.9, "r_x1": 432.5, "r_y1": 406.9, "r_x2": 432.5, "r_y2": 399.8, "r_x3": 393.8, "r_y3": 399.8, "coord_origin": "TOPLEFT" }, "text": "vocabulary:", "orig": "vocabulary:", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 44, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 434.6, "r_y0": 406.9, "r_x1": 438.8, "r_y1": 406.9, "r_x2": 438.8, "r_y2": 399.8, "r_x3": 434.6, "r_y3": 399.8, "coord_origin": "TOPLEFT" }, "text": "5", "orig": "5", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 45, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 440.9, "r_y0": 406.9, "r_x1": 463.2, "r_y1": 406.9, "r_x2": 463.2, "r_y2": 399.8, "r_x3": 440.9, "r_y3": 399.8, "coord_origin": "TOPLEFT" }, "text": "tokens", "orig": "tokens", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 46, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 384.1, "r_y0": 265.7, "r_x1": 414.0, "r_y1": 265.7, "r_x2": 414.0, "r_y2": 258.5, "r_x3": 384.1, "r_y3": 258.5, "coord_origin": "TOPLEFT" }, "text": "D OTSL", "orig": "D OTSL", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 47, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 393.8, "r_y0": 273.8, "r_x1": 451.5, "r_y1": 273.8, "r_x2": 451.5, "r_y2": 266.7, "r_x3": 393.8, "r_y3": 266.7, "coord_origin": "TOPLEFT" }, "text": "sequence length:", "orig": "sequence length:", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 48, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 453.6, "r_y0": 273.8, "r_x1": 462.0, "r_y1": 273.8, "r_x2": 462.0, "r_y2": 266.7, "r_x3": 453.6, "r_y3": 266.7, "coord_origin": "TOPLEFT" }, "text": "30", "orig": "30", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 49, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 151.8, "r_y0": 406.9, "r_x1": 233.9, "r_y1": 406.9, "r_x2": 233.9, "r_y2": 399.8, "r_x3": 151.8, "r_y3": 399.8, "coord_origin": "TOPLEFT" }, "text": "vocabulary for this table:", "orig": "vocabulary for this table:", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 50, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 236.0, "r_y0": 406.9, "r_x1": 244.4, "r_y1": 406.9, "r_x2": 244.4, "r_y2": 399.8, "r_x3": 236.0, "r_y3": 399.8, "coord_origin": "TOPLEFT" }, "text": "12", "orig": "12", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 51, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 246.5, "r_y0": 406.9, "r_x1": 268.8, "r_y1": 406.9, "r_x2": 268.8, "r_y2": 399.8, "r_x3": 246.5, "r_y3": 399.8, "coord_origin": "TOPLEFT" }, "text": "tokens", "orig": "tokens", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 52, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 154.3, "r_y0": 220.7, "r_x1": 159.8, "r_y1": 220.7, "r_x2": 159.8, "r_y2": 213.6, "r_x3": 154.3, "r_y3": 213.6, "coord_origin": "TOPLEFT" }, "text": "A", "orig": "A", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 53, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 321.1, "r_y0": 220.7, "r_x1": 326.5, "r_y1": 220.7, "r_x2": 326.5, "r_y2": 213.6, "r_x3": 321.1, "r_y3": 213.6, "coord_origin": "TOPLEFT" }, "text": "B", "orig": "B", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 54, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 153.1, "r_y0": 286.7, "r_x1": 175.8, "r_y1": 286.7, "r_x2": 175.8, "r_y2": 280.3, "r_x3": 153.1, "r_y3": 280.3, "coord_origin": "TOPLEFT" }, "text": "", "orig": "
", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 55, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 160.7, "r_y0": 293.5, "r_x1": 172.8, "r_y1": 293.5, "r_x2": 172.8, "r_y2": 287.1, "r_x3": 160.7, "r_y3": 287.1, "coord_origin": "TOPLEFT" }, "text": "", "orig": "", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 56, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 168.2, "r_y0": 300.3, "r_x1": 177.9, "r_y1": 300.3, "r_x2": 177.9, "r_y2": 293.9, "r_x3": 168.2, "r_y3": 293.9, "coord_origin": "TOPLEFT" }, "text": "", "orig": ">", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 60, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 263.4, "r_y0": 300.3, "r_x1": 278.9, "r_y1": 300.3, "r_x2": 278.9, "r_y2": 293.9, "r_x3": 263.4, "r_y3": 293.9, "coord_origin": "TOPLEFT" }, "text": "", "orig": "", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 61, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 280.8, "r_y0": 300.3, "r_x1": 290.5, "r_y1": 300.3, "r_x2": 290.5, "r_y2": 293.9, "r_x3": 280.8, "r_y3": 293.9, "coord_origin": "TOPLEFT" }, "text": "", "orig": ">", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 64, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 335.9, "r_y0": 300.3, "r_x1": 351.5, "r_y1": 300.3, "r_x2": 351.5, "r_y2": 293.9, "r_x3": 335.9, "r_y3": 293.9, "coord_origin": "TOPLEFT" }, "text": "", "orig": "", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 65, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 160.7, "r_y0": 307.1, "r_x1": 174.7, "r_y1": 307.1, "r_x2": 174.7, "r_y2": 300.8, "r_x3": 160.7, "r_y3": 300.8, "coord_origin": "TOPLEFT" }, "text": "", "orig": "", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 66, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 160.7, "r_y0": 314.0, "r_x1": 172.8, "r_y1": 314.0, "r_x2": 172.8, "r_y2": 307.6, "r_x3": 160.7, "r_y3": 307.6, "coord_origin": "TOPLEFT" }, "text": "", "orig": "", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 67, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 168.2, "r_y0": 320.8, "r_x1": 181.9, "r_y1": 320.8, "r_x2": 181.9, "r_y2": 314.4, "r_x3": 168.2, "r_y3": 314.4, "coord_origin": "TOPLEFT" }, "text": "", "orig": "", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 69, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 201.2, "r_y0": 320.8, "r_x1": 214.9, "r_y1": 320.8, "r_x2": 214.9, "r_y2": 314.4, "r_x3": 201.2, "r_y3": 314.4, "coord_origin": "TOPLEFT" }, "text": "", "orig": "", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 71, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 234.2, "r_y0": 320.8, "r_x1": 247.8, "r_y1": 320.8, "r_x2": 247.8, "r_y2": 314.4, "r_x3": 234.2, "r_y3": 314.4, "coord_origin": "TOPLEFT" }, "text": "", "orig": "", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 73, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 160.7, "r_y0": 327.6, "r_x1": 174.7, "r_y1": 327.6, "r_x2": 174.7, "r_y2": 321.2, "r_x3": 160.7, "r_y3": 321.2, "coord_origin": "TOPLEFT" }, "text": "", "orig": "", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 74, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 160.7, "r_y0": 334.4, "r_x1": 172.8, "r_y1": 334.4, "r_x2": 172.8, "r_y2": 328.0, "r_x3": 160.7, "r_y3": 328.0, "coord_origin": "TOPLEFT" }, "text": "", "orig": "", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 75, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 168.2, "r_y0": 341.2, "r_x1": 373.1, "r_y1": 341.2, "r_x2": 373.1, "r_y2": 334.8, "r_x3": 168.2, "r_y3": 334.8, "coord_origin": "TOPLEFT" }, "text": "", "orig": "", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 76, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 160.7, "r_y0": 348.0, "r_x1": 174.7, "r_y1": 348.0, "r_x2": 174.7, "r_y2": 341.7, "r_x3": 160.7, "r_y3": 341.7, "coord_origin": "TOPLEFT" }, "text": "", "orig": "", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 77, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 160.7, "r_y0": 354.9, "r_x1": 172.8, "r_y1": 354.9, "r_x2": 172.8, "r_y2": 348.5, "r_x3": 160.7, "r_y3": 348.5, "coord_origin": "TOPLEFT" }, "text": "", "orig": "", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 78, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 168.2, "r_y0": 361.7, "r_x1": 181.9, "r_y1": 361.7, "r_x2": 181.9, "r_y2": 355.3, "r_x3": 168.2, "r_y3": 355.3, "coord_origin": "TOPLEFT" }, "text": "", "orig": "", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 80, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 201.2, "r_y0": 361.7, "r_x1": 214.9, "r_y1": 361.7, "r_x2": 214.9, "r_y2": 355.3, "r_x3": 201.2, "r_y3": 355.3, "coord_origin": "TOPLEFT" }, "text": "", "orig": "", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 82, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 234.2, "r_y0": 361.7, "r_x1": 247.8, "r_y1": 361.7, "r_x2": 247.8, "r_y2": 355.3, "r_x3": 234.2, "r_y3": 355.3, "coord_origin": "TOPLEFT" }, "text": "", "orig": "", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 84, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 267.2, "r_y0": 361.7, "r_x1": 280.8, "r_y1": 361.7, "r_x2": 280.8, "r_y2": 355.3, "r_x3": 267.2, "r_y3": 355.3, "coord_origin": "TOPLEFT" }, "text": "", "orig": "", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 86, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 160.7, "r_y0": 368.5, "r_x1": 174.7, "r_y1": 368.5, "r_x2": 174.7, "r_y2": 362.1, "r_x3": 160.7, "r_y3": 362.1, "coord_origin": "TOPLEFT" }, "text": "", "orig": "", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 87, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 160.7, "r_y0": 375.3, "r_x1": 172.8, "r_y1": 375.3, "r_x2": 172.8, "r_y2": 368.9, "r_x3": 160.7, "r_y3": 368.9, "coord_origin": "TOPLEFT" }, "text": "", "orig": "", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 88, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 168.2, "r_y0": 382.1, "r_x1": 181.9, "r_y1": 382.1, "r_x2": 181.9, "r_y2": 375.7, "r_x3": 168.2, "r_y3": 375.7, "coord_origin": "TOPLEFT" }, "text": "", "orig": "", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 90, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 201.2, "r_y0": 382.1, "r_x1": 214.9, "r_y1": 382.1, "r_x2": 214.9, "r_y2": 375.7, "r_x3": 201.2, "r_y3": 375.7, "coord_origin": "TOPLEFT" }, "text": "", "orig": "", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 92, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 234.2, "r_y0": 382.1, "r_x1": 247.8, "r_y1": 382.1, "r_x2": 247.8, "r_y2": 375.7, "r_x3": 234.2, "r_y3": 375.7, "coord_origin": "TOPLEFT" }, "text": "", "orig": "", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 94, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 267.2, "r_y0": 382.1, "r_x1": 280.8, "r_y1": 382.1, "r_x2": 280.8, "r_y2": 375.7, "r_x3": 267.2, "r_y3": 375.7, "coord_origin": "TOPLEFT" }, "text": "", "orig": "", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 96, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 160.7, "r_y0": 388.9, "r_x1": 174.7, "r_y1": 388.9, "r_x2": 174.7, "r_y2": 382.6, "r_x3": 160.7, "r_y3": 382.6, "coord_origin": "TOPLEFT" }, "text": "", "orig": "", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 97, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 153.1, "r_y0": 395.8, "r_x1": 177.7, "r_y1": 395.8, "r_x2": 177.7, "r_y2": 389.4, "r_x3": 153.1, "r_y3": 389.4, "coord_origin": "TOPLEFT" }, "text": "
", "orig": "", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 68, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 183.8, "r_y0": 320.8, "r_x1": 199.3, "r_y1": 320.8, "r_x2": 199.3, "r_y2": 314.4, "r_x3": 183.8, "r_y3": 314.4, "coord_origin": "TOPLEFT" }, "text": "", "orig": "", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 70, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 216.8, "r_y0": 320.8, "r_x1": 232.3, "r_y1": 320.8, "r_x2": 232.3, "r_y2": 314.4, "r_x3": 216.8, "r_y3": 314.4, "coord_origin": "TOPLEFT" }, "text": "", "orig": "", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 72, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 249.7, "r_y0": 320.8, "r_x1": 265.3, "r_y1": 320.8, "r_x2": 265.3, "r_y2": 314.4, "r_x3": 249.7, "r_y3": 314.4, "coord_origin": "TOPLEFT" }, "text": "
", "orig": "", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 79, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 183.8, "r_y0": 361.7, "r_x1": 199.3, "r_y1": 361.7, "r_x2": 199.3, "r_y2": 355.3, "r_x3": 183.8, "r_y3": 355.3, "coord_origin": "TOPLEFT" }, "text": "", "orig": "", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 81, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 216.8, "r_y0": 361.7, "r_x1": 232.3, "r_y1": 361.7, "r_x2": 232.3, "r_y2": 355.3, "r_x3": 216.8, "r_y3": 355.3, "coord_origin": "TOPLEFT" }, "text": "", "orig": "", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 83, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 249.7, "r_y0": 361.7, "r_x1": 265.3, "r_y1": 361.7, "r_x2": 265.3, "r_y2": 355.3, "r_x3": 249.7, "r_y3": 355.3, "coord_origin": "TOPLEFT" }, "text": "", "orig": "", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 85, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 282.7, "r_y0": 361.7, "r_x1": 298.2, "r_y1": 361.7, "r_x2": 298.2, "r_y2": 355.3, "r_x3": 282.7, "r_y3": 355.3, "coord_origin": "TOPLEFT" }, "text": "
", "orig": "", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 89, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 183.8, "r_y0": 382.1, "r_x1": 199.3, "r_y1": 382.1, "r_x2": 199.3, "r_y2": 375.7, "r_x3": 183.8, "r_y3": 375.7, "coord_origin": "TOPLEFT" }, "text": "", "orig": "", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 91, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 216.8, "r_y0": 382.1, "r_x1": 232.3, "r_y1": 382.1, "r_x2": 232.3, "r_y2": 375.7, "r_x3": 216.8, "r_y3": 375.7, "coord_origin": "TOPLEFT" }, "text": "", "orig": "", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 93, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 249.7, "r_y0": 382.1, "r_x1": 265.3, "r_y1": 382.1, "r_x2": 265.3, "r_y2": 375.7, "r_x3": 249.7, "r_y3": 375.7, "coord_origin": "TOPLEFT" }, "text": "", "orig": "", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 95, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 282.7, "r_y0": 382.1, "r_x1": 298.2, "r_y1": 382.1, "r_x2": 298.2, "r_y2": 375.7, "r_x3": 282.7, "r_y3": 375.7, "coord_origin": "TOPLEFT" }, "text": "
", "orig": "", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 98, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 395.1, "r_y0": 419.9, "r_x1": 401.6, "r_y1": 419.9, "r_x2": 401.6, "r_y2": 411.3, "r_x3": 395.1, "r_y3": 411.3, "coord_origin": "TOPLEFT" }, "text": "C", "orig": "C", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 99, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 407.4, "r_y0": 419.9, "r_x1": 412.5, "r_y1": 419.9, "r_x2": 412.5, "r_y2": 411.3, "r_x3": 407.4, "r_y3": 411.3, "coord_origin": "TOPLEFT" }, "text": "L", "orig": "L", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 100, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 418.7, "r_y0": 419.9, "r_x1": 425.3, "r_y1": 419.9, "r_x2": 425.3, "r_y2": 411.3, "r_x3": 418.7, "r_y3": 411.3, "coord_origin": "TOPLEFT" }, "text": "U", "orig": "U", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 101, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 430.5, "r_y0": 419.9, "r_x1": 436.6, "r_y1": 419.9, "r_x2": 436.6, "r_y2": 411.3, "r_x3": 430.5, "r_y3": 411.3, "coord_origin": "TOPLEFT" }, "text": "X", "orig": "X", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 102, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 152.4, "r_y0": 416.2, "r_x1": 175.1, "r_y1": 416.2, "r_x2": 175.1, "r_y2": 409.8, "r_x3": 152.4, "r_y3": 409.8, "coord_origin": "TOPLEFT" }, "text": "", "orig": "
", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 103, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 178.9, "r_y0": 416.2, "r_x1": 191.0, "r_y1": 416.2, "r_x2": 191.0, "r_y2": 409.8, "r_x3": 178.9, "r_y3": 409.8, "coord_origin": "TOPLEFT" }, "text": "", "orig": "", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 104, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 194.8, "r_y0": 416.2, "r_x1": 208.8, "r_y1": 416.2, "r_x2": 208.8, "r_y2": 409.8, "r_x3": 194.8, "r_y3": 409.8, "coord_origin": "TOPLEFT" }, "text": "", "orig": "", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 105, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 212.6, "r_y0": 416.2, "r_x1": 226.3, "r_y1": 416.2, "r_x2": 226.3, "r_y2": 409.8, "r_x3": 212.6, "r_y3": 409.8, "coord_origin": "TOPLEFT" }, "text": "", "orig": "", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 107, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 249.4, "r_y0": 416.2, "r_x1": 259.0, "r_y1": 416.2, "r_x2": 259.0, "r_y2": 409.8, "r_x3": 249.4, "r_y3": 409.8, "coord_origin": "TOPLEFT" }, "text": "", "orig": ">", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 113, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 244.5, "r_y0": 424.5, "r_x1": 269.1, "r_y1": 424.5, "r_x2": 269.1, "r_y2": 418.1, "r_x3": 244.5, "r_y3": 418.1, "coord_origin": "TOPLEFT" }, "text": "
", "orig": "", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 106, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 230.0, "r_y0": 416.2, "r_x1": 245.6, "r_y1": 416.2, "r_x2": 245.6, "r_y2": 409.8, "r_x3": 230.0, "r_y3": 409.8, "coord_origin": "TOPLEFT" }, "text": "
", "orig": "", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 114, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 154.5, "r_y0": 265.7, "r_x1": 159.6, "r_y1": 265.7, "r_x2": 159.6, "r_y2": 258.6, "r_x3": 154.5, "r_y3": 258.6, "coord_origin": "TOPLEFT" }, "text": "C", "orig": "C", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 115, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 164.7, "r_y0": 265.7, "r_x1": 185.2, "r_y1": 265.7, "r_x2": 185.2, "r_y2": 258.6, "r_x3": 164.7, "r_y3": 258.6, "coord_origin": "TOPLEFT" }, "text": "HTML", "orig": "HTML", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 116, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 164.4, "r_y0": 273.6, "r_x1": 222.1, "r_y1": 273.6, "r_x2": 222.1, "r_y2": 266.5, "r_x3": 164.4, "r_y3": 266.5, "coord_origin": "TOPLEFT" }, "text": "sequence length:", "orig": "sequence length:", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 117, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 224.2, "r_y0": 273.6, "r_x1": 232.6, "r_y1": 273.6, "r_x2": 232.6, "r_y2": 266.5, "r_x3": 224.2, "r_y3": 266.5, "coord_origin": "TOPLEFT" }, "text": "55", "orig": "55", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [ { "id": 11, "label": "text", "bbox": { "l": 396.4, "t": 281.0, "r": 403.0, "b": 289.5, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 12, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 396.4, "r_y0": 289.5, "r_x1": 403.0, "r_y1": 289.5, "r_x2": 403.0, "r_y2": 281.0, "r_x3": 396.4, "r_y3": 281.0, "coord_origin": "TOPLEFT" }, "text": "C", "orig": "C", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 12, "label": "text", "bbox": { "l": 418.6, "t": 280.9, "r": 425.1, "b": 289.4, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 13, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 418.6, "r_y0": 289.4, "r_x1": 425.1, "r_y1": 289.4, "r_x2": 425.1, "r_y2": 280.9, "r_x3": 418.6, "r_y3": 280.9, "coord_origin": "TOPLEFT" }, "text": "C", "orig": "C", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 13, "label": "text", "bbox": { "l": 395.7, "t": 303.2, "r": 402.3, "b": 311.8, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 14, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 395.7, "r_y0": 311.8, "r_x1": 402.3, "r_y1": 311.8, "r_x2": 402.3, "r_y2": 303.2, "r_x3": 395.7, "r_y3": 303.2, "coord_origin": "TOPLEFT" }, "text": "C", "orig": "C", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 14, "label": "text", "bbox": { "l": 407.5, "t": 303.4, "r": 414.1, "b": 311.9, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 15, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 407.5, "r_y0": 311.9, "r_x1": 414.1, "r_y1": 311.9, "r_x2": 414.1, "r_y2": 303.4, "r_x3": 407.5, "r_y3": 303.4, "coord_origin": "TOPLEFT" }, "text": "C", "orig": "C", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 15, "label": "text", "bbox": { "l": 407.6, "t": 314.4, "r": 414.1, "b": 322.9, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 16, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 407.6, "r_y0": 322.9, "r_x1": 414.1, "r_y1": 322.9, "r_x2": 414.1, "r_y2": 314.4, "r_x3": 407.6, "r_y3": 314.4, "coord_origin": "TOPLEFT" }, "text": "C", "orig": "C", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 16, "label": "text", "bbox": { "l": 418.5, "t": 292.1, "r": 425.1, "b": 300.6, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 17, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 418.5, "r_y0": 300.6, "r_x1": 425.1, "r_y1": 300.6, "r_x2": 425.1, "r_y2": 292.1, "r_x3": 418.5, "r_y3": 292.1, "coord_origin": "TOPLEFT" }, "text": "C", "orig": "C", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 17, "label": "text", "bbox": { "l": 429.6, "t": 292.1, "r": 436.2, "b": 300.6, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 18, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 429.6, "r_y0": 300.6, "r_x1": 436.2, "r_y1": 300.6, "r_x2": 436.2, "r_y2": 292.1, "r_x3": 429.6, "r_y3": 292.1, "coord_origin": "TOPLEFT" }, "text": "C", "orig": "C", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 18, "label": "text", "bbox": { "l": 440.7, "t": 292.0, "r": 447.2, "b": 300.5, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 19, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 440.7, "r_y0": 300.5, "r_x1": 447.2, "r_y1": 300.5, "r_x2": 447.2, "r_y2": 292.0, "r_x3": 440.7, "r_y3": 292.0, "coord_origin": "TOPLEFT" }, "text": "C", "orig": "C", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 19, "label": "text", "bbox": { "l": 418.6, "t": 303.3, "r": 425.2, "b": 311.8, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 20, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 418.6, "r_y0": 311.8, "r_x1": 425.2, "r_y1": 311.8, "r_x2": 425.2, "r_y2": 303.3, "r_x3": 418.6, "r_y3": 303.3, "coord_origin": "TOPLEFT" }, "text": "C", "orig": "C", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 20, "label": "text", "bbox": { "l": 429.7, "t": 303.3, "r": 436.3, "b": 311.8, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 21, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 429.7, "r_y0": 311.8, "r_x1": 436.3, "r_y1": 311.8, "r_x2": 436.3, "r_y2": 303.3, "r_x3": 429.7, "r_y3": 303.3, "coord_origin": "TOPLEFT" }, "text": "C", "orig": "C", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 21, "label": "text", "bbox": { "l": 440.8, "t": 303.2, "r": 447.4, "b": 311.7, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 22, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 440.8, "r_y0": 311.7, "r_x1": 447.4, "r_y1": 311.7, "r_x2": 447.4, "r_y2": 303.2, "r_x3": 440.8, "r_y3": 303.2, "coord_origin": "TOPLEFT" }, "text": "C", "orig": "C", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 22, "label": "text", "bbox": { "l": 418.6, "t": 314.6, "r": 425.2, "b": 323.1, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 23, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 418.6, "r_y0": 323.1, "r_x1": 425.2, "r_y1": 323.1, "r_x2": 425.2, "r_y2": 314.6, "r_x3": 418.6, "r_y3": 314.6, "coord_origin": "TOPLEFT" }, "text": "C", "orig": "C", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 23, "label": "text", "bbox": { "l": 429.7, "t": 314.6, "r": 436.3, "b": 323.1, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 24, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 429.7, "r_y0": 323.1, "r_x1": 436.3, "r_y1": 323.1, "r_x2": 436.3, "r_y2": 314.6, "r_x3": 429.7, "r_y3": 314.6, "coord_origin": "TOPLEFT" }, "text": "C", "orig": "C", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 24, "label": "text", "bbox": { "l": 440.8, "t": 314.5, "r": 447.4, "b": 323.0, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 25, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 440.8, "r_y0": 323.0, "r_x1": 447.4, "r_y1": 323.0, "r_x2": 447.4, "r_y2": 314.5, "r_x3": 440.8, "r_y3": 314.5, "coord_origin": "TOPLEFT" }, "text": "C", "orig": "C", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 25, "label": "text", "bbox": { "l": 407.4, "t": 325.3, "r": 414.0, "b": 333.8, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 26, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 407.4, "r_y0": 333.8, "r_x1": 414.0, "r_y1": 333.8, "r_x2": 414.0, "r_y2": 325.3, "r_x3": 407.4, "r_y3": 325.3, "coord_origin": "TOPLEFT" }, "text": "C", "orig": "C", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 26, "label": "text", "bbox": { "l": 418.5, "t": 325.5, "r": 425.0, "b": 334.0, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 27, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 418.5, "r_y0": 334.0, "r_x1": 425.0, "r_y1": 334.0, "r_x2": 425.0, "r_y2": 325.5, "r_x3": 418.5, "r_y3": 325.5, "coord_origin": "TOPLEFT" }, "text": "C", "orig": "C", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 27, "label": "text", "bbox": { "l": 429.5, "t": 325.5, "r": 436.1, "b": 334.0, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 28, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 429.5, "r_y0": 334.0, "r_x1": 436.1, "r_y1": 334.0, "r_x2": 436.1, "r_y2": 325.5, "r_x3": 429.5, "r_y3": 325.5, "coord_origin": "TOPLEFT" }, "text": "C", "orig": "C", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 28, "label": "text", "bbox": { "l": 440.6, "t": 325.4, "r": 447.2, "b": 333.9, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 29, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 440.6, "r_y0": 333.9, "r_x1": 447.2, "r_y1": 333.9, "r_x2": 447.2, "r_y2": 325.4, "r_x3": 440.6, "r_y3": 325.4, "coord_origin": "TOPLEFT" }, "text": "C", "orig": "C", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 29, "label": "text", "bbox": { "l": 451.9, "t": 280.2, "r": 463.5, "b": 288.7, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 30, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 451.9, "r_y0": 288.7, "r_x1": 463.5, "r_y1": 288.7, "r_x2": 463.5, "r_y2": 280.2, "r_x3": 451.9, "r_y3": 280.2, "coord_origin": "TOPLEFT" }, "text": "NL", "orig": "NL", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 30, "label": "text", "bbox": { "l": 452.2, "t": 291.6, "r": 463.8, "b": 300.1, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 31, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 452.2, "r_y0": 300.1, "r_x1": 463.8, "r_y1": 300.1, "r_x2": 463.8, "r_y2": 291.6, "r_x3": 452.2, "r_y3": 291.6, "coord_origin": "TOPLEFT" }, "text": "NL", "orig": "NL", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 31, "label": "text", "bbox": { "l": 452.2, "t": 302.8, "r": 463.8, "b": 311.4, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 32, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 452.2, "r_y0": 311.4, "r_x1": 463.8, "r_y1": 311.4, "r_x2": 463.8, "r_y2": 302.8, "r_x3": 452.2, "r_y3": 302.8, "coord_origin": "TOPLEFT" }, "text": "NL", "orig": "NL", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 32, "label": "text", "bbox": { "l": 452.1, "t": 314.1, "r": 463.7, "b": 322.6, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 33, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 452.1, "r_y0": 322.6, "r_x1": 463.7, "r_y1": 322.6, "r_x2": 463.7, "r_y2": 314.1, "r_x3": 452.1, "r_y3": 314.1, "coord_origin": "TOPLEFT" }, "text": "NL", "orig": "NL", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 33, "label": "text", "bbox": { "l": 452.3, "t": 325.5, "r": 463.9, "b": 334.0, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 34, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 452.3, "r_y0": 334.0, "r_x1": 463.9, "r_y1": 334.0, "r_x2": 463.9, "r_y2": 325.5, "r_x3": 452.3, "r_y3": 325.5, "coord_origin": "TOPLEFT" }, "text": "NL", "orig": "NL", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 34, "label": "text", "bbox": { "l": 396.1, "t": 314.5, "r": 402.7, "b": 323.0, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 35, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 396.1, "r_y0": 323.0, "r_x1": 402.7, "r_y1": 323.0, "r_x2": 402.7, "r_y2": 314.5, "r_x3": 396.1, "r_y3": 314.5, "coord_origin": "TOPLEFT" }, "text": "U", "orig": "U", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 35, "label": "text", "bbox": { "l": 396.0, "t": 325.4, "r": 402.6, "b": 333.9, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 36, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 396.0, "r_y0": 333.9, "r_x1": 402.6, "r_y1": 333.9, "r_x2": 402.6, "r_y2": 325.4, "r_x3": 396.0, "r_y3": 325.4, "coord_origin": "TOPLEFT" }, "text": "U", "orig": "U", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 36, "label": "text", "bbox": { "l": 396.3, "t": 292.3, "r": 402.8, "b": 300.8, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 37, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 396.3, "r_y0": 300.8, "r_x1": 402.8, "r_y1": 300.8, "r_x2": 402.8, "r_y2": 292.3, "r_x3": 396.3, "r_y3": 292.3, "coord_origin": "TOPLEFT" }, "text": "U", "orig": "U", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 37, "label": "text", "bbox": { "l": 408.5, "t": 281.0, "r": 413.6, "b": 289.5, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 38, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 408.5, "r_y0": 289.5, "r_x1": 413.6, "r_y1": 289.5, "r_x2": 413.6, "r_y2": 281.0, "r_x3": 408.5, "r_y3": 281.0, "coord_origin": "TOPLEFT" }, "text": "L", "orig": "L", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 38, "label": "text", "bbox": { "l": 430.6, "t": 280.5, "r": 435.6, "b": 289.0, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 39, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 430.6, "r_y0": 289.0, "r_x1": 435.6, "r_y1": 289.0, "r_x2": 435.6, "r_y2": 280.5, "r_x3": 430.6, "r_y3": 280.5, "coord_origin": "TOPLEFT" }, "text": "L", "orig": "L", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 39, "label": "text", "bbox": { "l": 441.1, "t": 280.4, "r": 446.1, "b": 288.9, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 40, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 441.1, "r_y0": 288.9, "r_x1": 446.1, "r_y1": 288.9, "r_x2": 446.1, "r_y2": 280.4, "r_x3": 441.1, "r_y3": 280.4, "coord_origin": "TOPLEFT" }, "text": "L", "orig": "L", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 40, "label": "text", "bbox": { "l": 408.0, "t": 292.1, "r": 414.0, "b": 300.7, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 41, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 408.0, "r_y0": 300.7, "r_x1": 414.0, "r_y1": 300.7, "r_x2": 414.0, "r_y2": 292.1, "r_x3": 408.0, "r_y3": 292.1, "coord_origin": "TOPLEFT" }, "text": "X", "orig": "X", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 41, "label": "text", "bbox": { "l": 441.3, "t": 411.2, "r": 452.9, "b": 419.7, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 42, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 441.3, "r_y0": 419.7, "r_x1": 452.9, "r_y1": 419.7, "r_x2": 452.9, "r_y2": 411.2, "r_x3": 441.3, "r_y3": 411.2, "coord_origin": "TOPLEFT" }, "text": "NL", "orig": "NL", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 42, "label": "text", "bbox": { "l": 393.8, "t": 399.8, "r": 432.5, "b": 406.9, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 43, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 393.8, "r_y0": 406.9, "r_x1": 432.5, "r_y1": 406.9, "r_x2": 432.5, "r_y2": 399.8, "r_x3": 393.8, "r_y3": 399.8, "coord_origin": "TOPLEFT" }, "text": "vocabulary:", "orig": "vocabulary:", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 43, "label": "text", "bbox": { "l": 434.6, "t": 399.8, "r": 438.8, "b": 406.9, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 44, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 434.6, "r_y0": 406.9, "r_x1": 438.8, "r_y1": 406.9, "r_x2": 438.8, "r_y2": 399.8, "r_x3": 434.6, "r_y3": 399.8, "coord_origin": "TOPLEFT" }, "text": "5", "orig": "5", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 44, "label": "text", "bbox": { "l": 440.9, "t": 399.8, "r": 463.2, "b": 406.9, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 45, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 440.9, "r_y0": 406.9, "r_x1": 463.2, "r_y1": 406.9, "r_x2": 463.2, "r_y2": 399.8, "r_x3": 440.9, "r_y3": 399.8, "coord_origin": "TOPLEFT" }, "text": "tokens", "orig": "tokens", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 45, "label": "text", "bbox": { "l": 384.1, "t": 258.5, "r": 414.0, "b": 265.7, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 46, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 384.1, "r_y0": 265.7, "r_x1": 414.0, "r_y1": 265.7, "r_x2": 414.0, "r_y2": 258.5, "r_x3": 384.1, "r_y3": 258.5, "coord_origin": "TOPLEFT" }, "text": "D OTSL", "orig": "D OTSL", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 46, "label": "text", "bbox": { "l": 393.8, "t": 266.7, "r": 451.5, "b": 273.8, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 47, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 393.8, "r_y0": 273.8, "r_x1": 451.5, "r_y1": 273.8, "r_x2": 451.5, "r_y2": 266.7, "r_x3": 393.8, "r_y3": 266.7, "coord_origin": "TOPLEFT" }, "text": "sequence length:", "orig": "sequence length:", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 47, "label": "text", "bbox": { "l": 453.6, "t": 266.7, "r": 462.0, "b": 273.8, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 48, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 453.6, "r_y0": 273.8, "r_x1": 462.0, "r_y1": 273.8, "r_x2": 462.0, "r_y2": 266.7, "r_x3": 453.6, "r_y3": 266.7, "coord_origin": "TOPLEFT" }, "text": "30", "orig": "30", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 48, "label": "text", "bbox": { "l": 151.8, "t": 399.8, "r": 233.9, "b": 406.9, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 49, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 151.8, "r_y0": 406.9, "r_x1": 233.9, "r_y1": 406.9, "r_x2": 233.9, "r_y2": 399.8, "r_x3": 151.8, "r_y3": 399.8, "coord_origin": "TOPLEFT" }, "text": "vocabulary for this table:", "orig": "vocabulary for this table:", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 49, "label": "text", "bbox": { "l": 236.0, "t": 399.8, "r": 244.4, "b": 406.9, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 50, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 236.0, "r_y0": 406.9, "r_x1": 244.4, "r_y1": 406.9, "r_x2": 244.4, "r_y2": 399.8, "r_x3": 236.0, "r_y3": 399.8, "coord_origin": "TOPLEFT" }, "text": "12", "orig": "12", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 50, "label": "text", "bbox": { "l": 246.5, "t": 399.8, "r": 268.8, "b": 406.9, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 51, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 246.5, "r_y0": 406.9, "r_x1": 268.8, "r_y1": 406.9, "r_x2": 268.8, "r_y2": 399.8, "r_x3": 246.5, "r_y3": 399.8, "coord_origin": "TOPLEFT" }, "text": "tokens", "orig": "tokens", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 51, "label": "text", "bbox": { "l": 154.3, "t": 213.6, "r": 159.8, "b": 220.7, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 52, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 154.3, "r_y0": 220.7, "r_x1": 159.8, "r_y1": 220.7, "r_x2": 159.8, "r_y2": 213.6, "r_x3": 154.3, "r_y3": 213.6, "coord_origin": "TOPLEFT" }, "text": "A", "orig": "A", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 52, "label": "text", "bbox": { "l": 321.1, "t": 213.6, "r": 326.5, "b": 220.7, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 53, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 321.1, "r_y0": 220.7, "r_x1": 326.5, "r_y1": 220.7, "r_x2": 326.5, "r_y2": 213.6, "r_x3": 321.1, "r_y3": 213.6, "coord_origin": "TOPLEFT" }, "text": "B", "orig": "B", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 53, "label": "text", "bbox": { "l": 153.1, "t": 280.3, "r": 175.8, "b": 286.7, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 54, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 153.1, "r_y0": 286.7, "r_x1": 175.8, "r_y1": 286.7, "r_x2": 175.8, "r_y2": 280.3, "r_x3": 153.1, "r_y3": 280.3, "coord_origin": "TOPLEFT" }, "text": "", "orig": "
", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 54, "label": "text", "bbox": { "l": 160.7, "t": 287.1, "r": 172.8, "b": 293.5, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 55, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 160.7, "r_y0": 293.5, "r_x1": 172.8, "r_y1": 293.5, "r_x2": 172.8, "r_y2": 287.1, "r_x3": 160.7, "r_y3": 287.1, "coord_origin": "TOPLEFT" }, "text": "", "orig": "", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 55, "label": "text", "bbox": { "l": 168.2, "t": 293.9, "r": 177.9, "b": 300.3, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 56, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 168.2, "r_y0": 300.3, "r_x1": 177.9, "r_y1": 300.3, "r_x2": 177.9, "r_y2": 293.9, "r_x3": 168.2, "r_y3": 293.9, "coord_origin": "TOPLEFT" }, "text": "", "orig": ">", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 59, "label": "text", "bbox": { "l": 263.4, "t": 293.9, "r": 278.9, "b": 300.3, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 60, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 263.4, "r_y0": 300.3, "r_x1": 278.9, "r_y1": 300.3, "r_x2": 278.9, "r_y2": 293.9, "r_x3": 263.4, "r_y3": 293.9, "coord_origin": "TOPLEFT" }, "text": "", "orig": "", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 60, "label": "text", "bbox": { "l": 280.8, "t": 293.9, "r": 290.5, "b": 300.3, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 61, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 280.8, "r_y0": 300.3, "r_x1": 290.5, "r_y1": 300.3, "r_x2": 290.5, "r_y2": 293.9, "r_x3": 280.8, "r_y3": 293.9, "coord_origin": "TOPLEFT" }, "text": "", "orig": ">", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 63, "label": "text", "bbox": { "l": 335.9, "t": 293.9, "r": 351.5, "b": 300.3, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 64, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 335.9, "r_y0": 300.3, "r_x1": 351.5, "r_y1": 300.3, "r_x2": 351.5, "r_y2": 293.9, "r_x3": 335.9, "r_y3": 293.9, "coord_origin": "TOPLEFT" }, "text": "", "orig": "", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 64, "label": "text", "bbox": { "l": 160.7, "t": 300.8, "r": 174.7, "b": 307.1, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 65, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 160.7, "r_y0": 307.1, "r_x1": 174.7, "r_y1": 307.1, "r_x2": 174.7, "r_y2": 300.8, "r_x3": 160.7, "r_y3": 300.8, "coord_origin": "TOPLEFT" }, "text": "", "orig": "", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 65, "label": "text", "bbox": { "l": 160.7, "t": 307.6, "r": 172.8, "b": 314.0, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 66, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 160.7, "r_y0": 314.0, "r_x1": 172.8, "r_y1": 314.0, "r_x2": 172.8, "r_y2": 307.6, "r_x3": 160.7, "r_y3": 307.6, "coord_origin": "TOPLEFT" }, "text": "", "orig": "", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 66, "label": "text", "bbox": { "l": 168.2, "t": 314.4, "r": 181.9, "b": 320.8, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 67, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 168.2, "r_y0": 320.8, "r_x1": 181.9, "r_y1": 320.8, "r_x2": 181.9, "r_y2": 314.4, "r_x3": 168.2, "r_y3": 314.4, "coord_origin": "TOPLEFT" }, "text": "", "orig": "", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 68, "label": "text", "bbox": { "l": 201.2, "t": 314.4, "r": 214.9, "b": 320.8, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 69, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 201.2, "r_y0": 320.8, "r_x1": 214.9, "r_y1": 320.8, "r_x2": 214.9, "r_y2": 314.4, "r_x3": 201.2, "r_y3": 314.4, "coord_origin": "TOPLEFT" }, "text": "", "orig": "", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 70, "label": "text", "bbox": { "l": 234.2, "t": 314.4, "r": 247.8, "b": 320.8, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 71, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 234.2, "r_y0": 320.8, "r_x1": 247.8, "r_y1": 320.8, "r_x2": 247.8, "r_y2": 314.4, "r_x3": 234.2, "r_y3": 314.4, "coord_origin": "TOPLEFT" }, "text": "", "orig": "", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 72, "label": "text", "bbox": { "l": 160.7, "t": 321.2, "r": 174.7, "b": 327.6, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 73, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 160.7, "r_y0": 327.6, "r_x1": 174.7, "r_y1": 327.6, "r_x2": 174.7, "r_y2": 321.2, "r_x3": 160.7, "r_y3": 321.2, "coord_origin": "TOPLEFT" }, "text": "", "orig": "", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 73, "label": "text", "bbox": { "l": 160.7, "t": 328.0, "r": 172.8, "b": 334.4, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 74, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 160.7, "r_y0": 334.4, "r_x1": 172.8, "r_y1": 334.4, "r_x2": 172.8, "r_y2": 328.0, "r_x3": 160.7, "r_y3": 328.0, "coord_origin": "TOPLEFT" }, "text": "", "orig": "", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 74, "label": "text", "bbox": { "l": 168.2, "t": 334.8, "r": 373.1, "b": 341.2, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 75, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 168.2, "r_y0": 341.2, "r_x1": 373.1, "r_y1": 341.2, "r_x2": 373.1, "r_y2": 334.8, "r_x3": 168.2, "r_y3": 334.8, "coord_origin": "TOPLEFT" }, "text": "", "orig": "", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 75, "label": "text", "bbox": { "l": 160.7, "t": 341.7, "r": 174.7, "b": 348.0, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 76, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 160.7, "r_y0": 348.0, "r_x1": 174.7, "r_y1": 348.0, "r_x2": 174.7, "r_y2": 341.7, "r_x3": 160.7, "r_y3": 341.7, "coord_origin": "TOPLEFT" }, "text": "", "orig": "", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 76, "label": "text", "bbox": { "l": 160.7, "t": 348.5, "r": 172.8, "b": 354.9, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 77, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 160.7, "r_y0": 354.9, "r_x1": 172.8, "r_y1": 354.9, "r_x2": 172.8, "r_y2": 348.5, "r_x3": 160.7, "r_y3": 348.5, "coord_origin": "TOPLEFT" }, "text": "", "orig": "", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 77, "label": "text", "bbox": { "l": 168.2, "t": 355.3, "r": 181.9, "b": 361.7, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 78, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 168.2, "r_y0": 361.7, "r_x1": 181.9, "r_y1": 361.7, "r_x2": 181.9, "r_y2": 355.3, "r_x3": 168.2, "r_y3": 355.3, "coord_origin": "TOPLEFT" }, "text": "", "orig": "", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 79, "label": "text", "bbox": { "l": 201.2, "t": 355.3, "r": 214.9, "b": 361.7, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 80, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 201.2, "r_y0": 361.7, "r_x1": 214.9, "r_y1": 361.7, "r_x2": 214.9, "r_y2": 355.3, "r_x3": 201.2, "r_y3": 355.3, "coord_origin": "TOPLEFT" }, "text": "", "orig": "", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 81, "label": "text", "bbox": { "l": 234.2, "t": 355.3, "r": 247.8, "b": 361.7, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 82, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 234.2, "r_y0": 361.7, "r_x1": 247.8, "r_y1": 361.7, "r_x2": 247.8, "r_y2": 355.3, "r_x3": 234.2, "r_y3": 355.3, "coord_origin": "TOPLEFT" }, "text": "", "orig": "", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 83, "label": "text", "bbox": { "l": 267.2, "t": 355.3, "r": 280.8, "b": 361.7, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 84, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 267.2, "r_y0": 361.7, "r_x1": 280.8, "r_y1": 361.7, "r_x2": 280.8, "r_y2": 355.3, "r_x3": 267.2, "r_y3": 355.3, "coord_origin": "TOPLEFT" }, "text": "", "orig": "", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 85, "label": "text", "bbox": { "l": 160.7, "t": 362.1, "r": 174.7, "b": 368.5, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 86, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 160.7, "r_y0": 368.5, "r_x1": 174.7, "r_y1": 368.5, "r_x2": 174.7, "r_y2": 362.1, "r_x3": 160.7, "r_y3": 362.1, "coord_origin": "TOPLEFT" }, "text": "", "orig": "", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 86, "label": "text", "bbox": { "l": 160.7, "t": 368.9, "r": 172.8, "b": 375.3, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 87, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 160.7, "r_y0": 375.3, "r_x1": 172.8, "r_y1": 375.3, "r_x2": 172.8, "r_y2": 368.9, "r_x3": 160.7, "r_y3": 368.9, "coord_origin": "TOPLEFT" }, "text": "", "orig": "", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 87, "label": "text", "bbox": { "l": 168.2, "t": 375.7, "r": 181.9, "b": 382.1, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 88, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 168.2, "r_y0": 382.1, "r_x1": 181.9, "r_y1": 382.1, "r_x2": 181.9, "r_y2": 375.7, "r_x3": 168.2, "r_y3": 375.7, "coord_origin": "TOPLEFT" }, "text": "", "orig": "", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 89, "label": "text", "bbox": { "l": 201.2, "t": 375.7, "r": 214.9, "b": 382.1, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 90, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 201.2, "r_y0": 382.1, "r_x1": 214.9, "r_y1": 382.1, "r_x2": 214.9, "r_y2": 375.7, "r_x3": 201.2, "r_y3": 375.7, "coord_origin": "TOPLEFT" }, "text": "", "orig": "", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 91, "label": "text", "bbox": { "l": 234.2, "t": 375.7, "r": 247.8, "b": 382.1, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 92, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 234.2, "r_y0": 382.1, "r_x1": 247.8, "r_y1": 382.1, "r_x2": 247.8, "r_y2": 375.7, "r_x3": 234.2, "r_y3": 375.7, "coord_origin": "TOPLEFT" }, "text": "", "orig": "", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 93, "label": "text", "bbox": { "l": 267.2, "t": 375.7, "r": 280.8, "b": 382.1, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 94, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 267.2, "r_y0": 382.1, "r_x1": 280.8, "r_y1": 382.1, "r_x2": 280.8, "r_y2": 375.7, "r_x3": 267.2, "r_y3": 375.7, "coord_origin": "TOPLEFT" }, "text": "", "orig": "", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 95, "label": "text", "bbox": { "l": 160.7, "t": 382.6, "r": 174.7, "b": 388.9, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 96, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 160.7, "r_y0": 388.9, "r_x1": 174.7, "r_y1": 388.9, "r_x2": 174.7, "r_y2": 382.6, "r_x3": 160.7, "r_y3": 382.6, "coord_origin": "TOPLEFT" }, "text": "", "orig": "", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 96, "label": "text", "bbox": { "l": 153.1, "t": 389.4, "r": 177.7, "b": 395.8, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 97, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 153.1, "r_y0": 395.8, "r_x1": 177.7, "r_y1": 395.8, "r_x2": 177.7, "r_y2": 389.4, "r_x3": 153.1, "r_y3": 389.4, "coord_origin": "TOPLEFT" }, "text": "
", "orig": "", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 67, "label": "text", "bbox": { "l": 183.8, "t": 314.4, "r": 199.3, "b": 320.8, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 68, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 183.8, "r_y0": 320.8, "r_x1": 199.3, "r_y1": 320.8, "r_x2": 199.3, "r_y2": 314.4, "r_x3": 183.8, "r_y3": 314.4, "coord_origin": "TOPLEFT" }, "text": "", "orig": "", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 69, "label": "text", "bbox": { "l": 216.8, "t": 314.4, "r": 232.3, "b": 320.8, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 70, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 216.8, "r_y0": 320.8, "r_x1": 232.3, "r_y1": 320.8, "r_x2": 232.3, "r_y2": 314.4, "r_x3": 216.8, "r_y3": 314.4, "coord_origin": "TOPLEFT" }, "text": "", "orig": "", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 71, "label": "text", "bbox": { "l": 249.7, "t": 314.4, "r": 265.3, "b": 320.8, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 72, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 249.7, "r_y0": 320.8, "r_x1": 265.3, "r_y1": 320.8, "r_x2": 265.3, "r_y2": 314.4, "r_x3": 249.7, "r_y3": 314.4, "coord_origin": "TOPLEFT" }, "text": "
", "orig": "", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 78, "label": "text", "bbox": { "l": 183.8, "t": 355.3, "r": 199.3, "b": 361.7, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 79, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 183.8, "r_y0": 361.7, "r_x1": 199.3, "r_y1": 361.7, "r_x2": 199.3, "r_y2": 355.3, "r_x3": 183.8, "r_y3": 355.3, "coord_origin": "TOPLEFT" }, "text": "", "orig": "", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 80, "label": "text", "bbox": { "l": 216.8, "t": 355.3, "r": 232.3, "b": 361.7, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 81, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 216.8, "r_y0": 361.7, "r_x1": 232.3, "r_y1": 361.7, "r_x2": 232.3, "r_y2": 355.3, "r_x3": 216.8, "r_y3": 355.3, "coord_origin": "TOPLEFT" }, "text": "", "orig": "", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 82, "label": "text", "bbox": { "l": 249.7, "t": 355.3, "r": 265.3, "b": 361.7, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 83, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 249.7, "r_y0": 361.7, "r_x1": 265.3, "r_y1": 361.7, "r_x2": 265.3, "r_y2": 355.3, "r_x3": 249.7, "r_y3": 355.3, "coord_origin": "TOPLEFT" }, "text": "", "orig": "", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 84, "label": "text", "bbox": { "l": 282.7, "t": 355.3, "r": 298.2, "b": 361.7, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 85, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 282.7, "r_y0": 361.7, "r_x1": 298.2, "r_y1": 361.7, "r_x2": 298.2, "r_y2": 355.3, "r_x3": 282.7, "r_y3": 355.3, "coord_origin": "TOPLEFT" }, "text": "
", "orig": "", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 88, "label": "text", "bbox": { "l": 183.8, "t": 375.7, "r": 199.3, "b": 382.1, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 89, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 183.8, "r_y0": 382.1, "r_x1": 199.3, "r_y1": 382.1, "r_x2": 199.3, "r_y2": 375.7, "r_x3": 183.8, "r_y3": 375.7, "coord_origin": "TOPLEFT" }, "text": "", "orig": "", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 90, "label": "text", "bbox": { "l": 216.8, "t": 375.7, "r": 232.3, "b": 382.1, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 91, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 216.8, "r_y0": 382.1, "r_x1": 232.3, "r_y1": 382.1, "r_x2": 232.3, "r_y2": 375.7, "r_x3": 216.8, "r_y3": 375.7, "coord_origin": "TOPLEFT" }, "text": "", "orig": "", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 92, "label": "text", "bbox": { "l": 249.7, "t": 375.7, "r": 265.3, "b": 382.1, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 93, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 249.7, "r_y0": 382.1, "r_x1": 265.3, "r_y1": 382.1, "r_x2": 265.3, "r_y2": 375.7, "r_x3": 249.7, "r_y3": 375.7, "coord_origin": "TOPLEFT" }, "text": "", "orig": "", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 94, "label": "text", "bbox": { "l": 282.7, "t": 375.7, "r": 298.2, "b": 382.1, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 95, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 282.7, "r_y0": 382.1, "r_x1": 298.2, "r_y1": 382.1, "r_x2": 298.2, "r_y2": 375.7, "r_x3": 282.7, "r_y3": 375.7, "coord_origin": "TOPLEFT" }, "text": "
", "orig": "", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 97, "label": "text", "bbox": { "l": 395.1, "t": 411.3, "r": 401.6, "b": 419.9, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 98, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 395.1, "r_y0": 419.9, "r_x1": 401.6, "r_y1": 419.9, "r_x2": 401.6, "r_y2": 411.3, "r_x3": 395.1, "r_y3": 411.3, "coord_origin": "TOPLEFT" }, "text": "C", "orig": "C", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 98, "label": "text", "bbox": { "l": 407.4, "t": 411.3, "r": 412.5, "b": 419.9, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 99, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 407.4, "r_y0": 419.9, "r_x1": 412.5, "r_y1": 419.9, "r_x2": 412.5, "r_y2": 411.3, "r_x3": 407.4, "r_y3": 411.3, "coord_origin": "TOPLEFT" }, "text": "L", "orig": "L", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 99, "label": "text", "bbox": { "l": 418.7, "t": 411.3, "r": 425.3, "b": 419.9, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 100, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 418.7, "r_y0": 419.9, "r_x1": 425.3, "r_y1": 419.9, "r_x2": 425.3, "r_y2": 411.3, "r_x3": 418.7, "r_y3": 411.3, "coord_origin": "TOPLEFT" }, "text": "U", "orig": "U", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 100, "label": "text", "bbox": { "l": 430.5, "t": 411.3, "r": 436.6, "b": 419.9, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 101, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 430.5, "r_y0": 419.9, "r_x1": 436.6, "r_y1": 419.9, "r_x2": 436.6, "r_y2": 411.3, "r_x3": 430.5, "r_y3": 411.3, "coord_origin": "TOPLEFT" }, "text": "X", "orig": "X", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 101, "label": "text", "bbox": { "l": 152.4, "t": 409.8, "r": 175.1, "b": 416.2, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 102, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 152.4, "r_y0": 416.2, "r_x1": 175.1, "r_y1": 416.2, "r_x2": 175.1, "r_y2": 409.8, "r_x3": 152.4, "r_y3": 409.8, "coord_origin": "TOPLEFT" }, "text": "", "orig": "
", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 102, "label": "text", "bbox": { "l": 178.9, "t": 409.8, "r": 191.0, "b": 416.2, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 103, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 178.9, "r_y0": 416.2, "r_x1": 191.0, "r_y1": 416.2, "r_x2": 191.0, "r_y2": 409.8, "r_x3": 178.9, "r_y3": 409.8, "coord_origin": "TOPLEFT" }, "text": "", "orig": "", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 103, "label": "text", "bbox": { "l": 194.8, "t": 409.8, "r": 208.8, "b": 416.2, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 104, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 194.8, "r_y0": 416.2, "r_x1": 208.8, "r_y1": 416.2, "r_x2": 208.8, "r_y2": 409.8, "r_x3": 194.8, "r_y3": 409.8, "coord_origin": "TOPLEFT" }, "text": "", "orig": "", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 104, "label": "text", "bbox": { "l": 212.6, "t": 409.8, "r": 226.3, "b": 416.2, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 105, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 212.6, "r_y0": 416.2, "r_x1": 226.3, "r_y1": 416.2, "r_x2": 226.3, "r_y2": 409.8, "r_x3": 212.6, "r_y3": 409.8, "coord_origin": "TOPLEFT" }, "text": "", "orig": "", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 106, "label": "text", "bbox": { "l": 249.4, "t": 409.8, "r": 259.0, "b": 416.2, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 107, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 249.4, "r_y0": 416.2, "r_x1": 259.0, "r_y1": 416.2, "r_x2": 259.0, "r_y2": 409.8, "r_x3": 249.4, "r_y3": 409.8, "coord_origin": "TOPLEFT" }, "text": "", "orig": ">", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 112, "label": "text", "bbox": { "l": 244.5, "t": 418.1, "r": 269.1, "b": 424.5, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 113, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 244.5, "r_y0": 424.5, "r_x1": 269.1, "r_y1": 424.5, "r_x2": 269.1, "r_y2": 418.1, "r_x3": 244.5, "r_y3": 418.1, "coord_origin": "TOPLEFT" }, "text": "
", "orig": "", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 105, "label": "text", "bbox": { "l": 230.0, "t": 409.8, "r": 245.6, "b": 416.2, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 106, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 230.0, "r_y0": 416.2, "r_x1": 245.6, "r_y1": 416.2, "r_x2": 245.6, "r_y2": 409.8, "r_x3": 230.0, "r_y3": 409.8, "coord_origin": "TOPLEFT" }, "text": "
", "orig": "", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 113, "label": "text", "bbox": { "l": 154.5, "t": 258.6, "r": 159.6, "b": 265.7, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 114, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 154.5, "r_y0": 265.7, "r_x1": 159.6, "r_y1": 265.7, "r_x2": 159.6, "r_y2": 258.6, "r_x3": 154.5, "r_y3": 258.6, "coord_origin": "TOPLEFT" }, "text": "C", "orig": "C", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 114, "label": "text", "bbox": { "l": 164.7, "t": 258.6, "r": 185.2, "b": 265.7, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 115, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 164.7, "r_y0": 265.7, "r_x1": 185.2, "r_y1": 265.7, "r_x2": 185.2, "r_y2": 258.6, "r_x3": 164.7, "r_y3": 258.6, "coord_origin": "TOPLEFT" }, "text": "HTML", "orig": "HTML", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 115, "label": "text", "bbox": { "l": 164.4, "t": 266.5, "r": 222.1, "b": 273.6, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 116, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 164.4, "r_y0": 273.6, "r_x1": 222.1, "r_y1": 273.6, "r_x2": 222.1, "r_y2": 266.5, "r_x3": 164.4, "r_y3": 266.5, "coord_origin": "TOPLEFT" }, "text": "sequence length:", "orig": "sequence length:", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 116, "label": "text", "bbox": { "l": 224.2, "t": 266.5, "r": 232.6, "b": 273.6, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 117, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 224.2, "r_y0": 273.6, "r_x1": 232.6, "r_y1": 273.6, "r_x2": 232.6, "r_y2": 266.5, "r_x3": 224.2, "r_y3": 266.5, "coord_origin": "TOPLEFT" }, "text": "55", "orig": "55", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] } ] }, "text": "", "annotations": [], "provenance": null, "predicted_class": null, "confidence": null }, { "label": "text", "id": 2, "page_no": 1, "cluster": { "id": 2, "label": "text", "bbox": { "l": 134.8, "t": 452.3, "r": 480.6, "b": 520.9, "coord_origin": "TOPLEFT" }, "confidence": 0.95, "cells": [ { "index": 118, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 134.8, "r_y0": 461.1, "r_x1": 161.3, "r_y1": 461.1, "r_x2": 161.3, "r_y2": 452.3, "r_x3": 134.8, "r_y3": 452.3, "coord_origin": "TOPLEFT" }, "text": "today,", "orig": "today,", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 119, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 164.3, "r_y0": 461.1, "r_x1": 226.3, "r_y1": 461.1, "r_x2": 226.3, "r_y2": 452.3, "r_x3": 164.3, "r_y3": 452.3, "coord_origin": "TOPLEFT" }, "text": "table detection", "orig": "table detection", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 120, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 230.0, "r_y0": 461.1, "r_x1": 480.6, "r_y1": 461.1, "r_x2": 480.6, "r_y2": 452.3, "r_x3": 230.0, "r_y3": 452.3, "coord_origin": "TOPLEFT" }, "text": "in documents is a well understood problem, and the latest", "orig": "in documents is a well understood problem, and the latest", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 121, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 134.8, "r_y0": 473.1, "r_x1": 480.6, "r_y1": 473.1, "r_x2": 480.6, "r_y2": 464.3, "r_x3": 134.8, "r_y3": 464.3, "coord_origin": "TOPLEFT" }, "text": "state-of-the-art (SOTA) object detection methods provide an accuracy compa-", "orig": "state-of-the-art (SOTA) object detection methods provide an accuracy compa-", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 122, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 134.8, "r_y0": 485.0, "r_x1": 480.6, "r_y1": 485.0, "r_x2": 480.6, "r_y2": 476.2, "r_x3": 134.8, "r_y3": 476.2, "coord_origin": "TOPLEFT" }, "text": "rable to human observers [7,8,10,14,23]. On the other hand, the problem of table", "orig": "rable to human observers [7,8,10,14,23]. On the other hand, the problem of table", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 123, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 134.8, "r_y0": 497.0, "r_x1": 480.6, "r_y1": 497.0, "r_x2": 480.6, "r_y2": 488.2, "r_x3": 134.8, "r_y3": 488.2, "coord_origin": "TOPLEFT" }, "text": "structure recognition (TSR) is a lot more challenging and remains a very active", "orig": "structure recognition (TSR) is a lot more challenging and remains a very active", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 124, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 134.8, "r_y0": 508.9, "r_x1": 480.6, "r_y1": 508.9, "r_x2": 480.6, "r_y2": 500.1, "r_x3": 134.8, "r_y3": 500.1, "coord_origin": "TOPLEFT" }, "text": "area of research, in which many novel machine learning algorithms are being", "orig": "area of research, in which many novel machine learning algorithms are being", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 125, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 134.8, "r_y0": 520.9, "r_x1": 313.2, "r_y1": 520.9, "r_x2": 313.2, "r_y2": 512.1, "r_x3": 134.8, "r_y3": 512.1, "coord_origin": "TOPLEFT" }, "text": "explored [3,4,5,9,11,12,13,14,17,18,21,22].", "orig": "explored [3,4,5,9,11,12,13,14,17,18,21,22].", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, "text": "today, table detection in documents is a well understood problem, and the latest state-of-the-art (SOTA) object detection methods provide an accuracy comparable to human observers [7,8,10,14,23]. On the other hand, the problem of table structure recognition (TSR) is a lot more challenging and remains a very active area of research, in which many novel machine learning algorithms are being explored [3,4,5,9,11,12,13,14,17,18,21,22]." }, { "label": "text", "id": 0, "page_no": 1, "cluster": { "id": 0, "label": "text", "bbox": { "l": 134.8, "t": 524.6, "r": 480.6, "b": 664.9, "coord_origin": "TOPLEFT" }, "confidence": 0.98, "cells": [ { "index": 126, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 149.7, "r_y0": 533.3, "r_x1": 480.6, "r_y1": 533.3, "r_x2": 480.6, "r_y2": 524.6, "r_x3": 149.7, "r_y3": 524.6, "coord_origin": "TOPLEFT" }, "text": "Recently emerging SOTA methods for table structure recognition employ", "orig": "Recently emerging SOTA methods for table structure recognition employ", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 127, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 134.8, "r_y0": 545.3, "r_x1": 480.6, "r_y1": 545.3, "r_x2": 480.6, "r_y2": 536.5, "r_x3": 134.8, "r_y3": 536.5, "coord_origin": "TOPLEFT" }, "text": "transformer-based models, in which an image of the table is provided to the net-", "orig": "transformer-based models, in which an image of the table is provided to the net-", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 128, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 134.8, "r_y0": 557.3, "r_x1": 480.6, "r_y1": 557.3, "r_x2": 480.6, "r_y2": 548.5, "r_x3": 134.8, "r_y3": 548.5, "coord_origin": "TOPLEFT" }, "text": "work in order to predict the structure of the table as a sequence of tokens. These", "orig": "work in order to predict the structure of the table as a sequence of tokens. These", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 129, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 134.8, "r_y0": 569.2, "r_x1": 480.6, "r_y1": 569.2, "r_x2": 480.6, "r_y2": 560.4, "r_x3": 134.8, "r_y3": 560.4, "coord_origin": "TOPLEFT" }, "text": "image-to-sequence (Im2Seq) models are extremely powerful, since they allow for", "orig": "image-to-sequence (Im2Seq) models are extremely powerful, since they allow for", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 130, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 134.8, "r_y0": 581.2, "r_x1": 480.6, "r_y1": 581.2, "r_x2": 480.6, "r_y2": 572.4, "r_x3": 134.8, "r_y3": 572.4, "coord_origin": "TOPLEFT" }, "text": "a purely data-driven solution. The tokens of the sequence typically belong to a", "orig": "a purely data-driven solution. The tokens of the sequence typically belong to a", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 131, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 134.8, "r_y0": 593.1, "r_x1": 480.6, "r_y1": 593.1, "r_x2": 480.6, "r_y2": 584.3, "r_x3": 134.8, "r_y3": 584.3, "coord_origin": "TOPLEFT" }, "text": "markup language such as HTML, Latex or Markdown, which allow to describe", "orig": "markup language such as HTML, Latex or Markdown, which allow to describe", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 132, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 134.8, "r_y0": 605.1, "r_x1": 480.6, "r_y1": 605.1, "r_x2": 480.6, "r_y2": 596.3, "r_x3": 134.8, "r_y3": 596.3, "coord_origin": "TOPLEFT" }, "text": "table structure as rows, columns and spanning cells in various configurations.", "orig": "table structure as rows, columns and spanning cells in various configurations.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 133, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 134.8, "r_y0": 617.0, "r_x1": 480.6, "r_y1": 617.0, "r_x2": 480.6, "r_y2": 608.2, "r_x3": 134.8, "r_y3": 608.2, "coord_origin": "TOPLEFT" }, "text": "In Figure 1, we illustrate how HTML is used to represent the table-structure", "orig": "In Figure 1, we illustrate how HTML is used to represent the table-structure", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 134, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 134.8, "r_y0": 629.0, "r_x1": 480.6, "r_y1": 629.0, "r_x2": 480.6, "r_y2": 620.2, "r_x3": 134.8, "r_y3": 620.2, "coord_origin": "TOPLEFT" }, "text": "of a particular example table. Public table-structure data sets such as PubTab-", "orig": "of a particular example table. Public table-structure data sets such as PubTab-", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 135, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 134.8, "r_y0": 640.9, "r_x1": 480.6, "r_y1": 640.9, "r_x2": 480.6, "r_y2": 632.1, "r_x3": 134.8, "r_y3": 632.1, "coord_origin": "TOPLEFT" }, "text": "Net [22], and FinTabNet [21], which were created in a semi-automated way from", "orig": "Net [22], and FinTabNet [21], which were created in a semi-automated way from", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 136, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 134.8, "r_y0": 652.9, "r_x1": 480.6, "r_y1": 652.9, "r_x2": 480.6, "r_y2": 644.1, "r_x3": 134.8, "r_y3": 644.1, "coord_origin": "TOPLEFT" }, "text": "paired PDF and HTML sources (e.g. PubMed Central), popularized primarily", "orig": "paired PDF and HTML sources (e.g. PubMed Central), popularized primarily", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 137, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 134.8, "r_y0": 664.9, "r_x1": 421.5, "r_y1": 664.9, "r_x2": 421.5, "r_y2": 656.1, "r_x3": 134.8, "r_y3": 656.1, "coord_origin": "TOPLEFT" }, "text": "the use of HTML as ground-truth representation format for TSR.", "orig": "the use of HTML as ground-truth representation format for TSR.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, "text": "Recently emerging SOTA methods for table structure recognition employ transformer-based models, in which an image of the table is provided to the network in order to predict the structure of the table as a sequence of tokens. These image-to-sequence (Im2Seq) models are extremely powerful, since they allow for a purely data-driven solution. The tokens of the sequence typically belong to a markup language such as HTML, Latex or Markdown, which allow to describe table structure as rows, columns and spanning cells in various configurations. In Figure 1, we illustrate how HTML is used to represent the table-structure of a particular example table. Public table-structure data sets such as PubTabNet [22], and FinTabNet [21], which were created in a semi-automated way from paired PDF and HTML sources (e.g. PubMed Central), popularized primarily the use of HTML as ground-truth representation format for TSR." } ], "body": [ { "label": "caption", "id": 4, "page_no": 1, "cluster": { "id": 4, "label": "caption", "bbox": { "l": 134.8, "t": 126.3, "r": 480.6, "b": 200.2, "coord_origin": "TOPLEFT" }, "confidence": 0.89, "cells": [ { "index": 3, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 134.8, "r_y0": 134.3, "r_x1": 162.6, "r_y1": 134.3, "r_x2": 162.6, "r_y2": 126.3, "r_x3": 134.8, "r_y3": 126.3, "coord_origin": "TOPLEFT" }, "text": "Fig. 1.", "orig": "Fig. 1.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 4, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 167.1, "r_y0": 134.5, "r_x1": 480.6, "r_y1": 134.5, "r_x2": 480.6, "r_y2": 126.4, "r_x3": 167.1, "r_y3": 126.4, "coord_origin": "TOPLEFT" }, "text": "Comparison between HTML and OTSL table structure representation: (A)", "orig": "Comparison between HTML and OTSL table structure representation: (A)", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 5, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 134.8, "r_y0": 145.4, "r_x1": 480.6, "r_y1": 145.4, "r_x2": 480.6, "r_y2": 137.4, "r_x3": 134.8, "r_y3": 137.4, "coord_origin": "TOPLEFT" }, "text": "table-example with complex row and column headers, including a 2D empty span,", "orig": "table-example with complex row and column headers, including a 2D empty span,", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 6, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 134.8, "r_y0": 156.4, "r_x1": 148.0, "r_y1": 156.4, "r_x2": 148.0, "r_y2": 148.3, "r_x3": 134.8, "r_y3": 148.3, "coord_origin": "TOPLEFT" }, "text": "(B)", "orig": "(B)", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 7, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 152.4, "r_y0": 156.4, "r_x1": 480.6, "r_y1": 156.4, "r_x2": 480.6, "r_y2": 148.3, "r_x3": 152.4, "r_y3": 148.3, "coord_origin": "TOPLEFT" }, "text": "minimal graphical representation of table structure using rectangular layout, (C)", "orig": "minimal graphical representation of table structure using rectangular layout, (C)", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 8, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 134.8, "r_y0": 167.3, "r_x1": 480.6, "r_y1": 167.3, "r_x2": 480.6, "r_y2": 159.3, "r_x3": 134.8, "r_y3": 159.3, "coord_origin": "TOPLEFT" }, "text": "HTML representation, (D) OTSL representation. This example demonstrates many of", "orig": "HTML representation, (D) OTSL representation. This example demonstrates many of", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 9, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 134.8, "r_y0": 178.3, "r_x1": 480.6, "r_y1": 178.3, "r_x2": 480.6, "r_y2": 170.2, "r_x3": 134.8, "r_y3": 170.2, "coord_origin": "TOPLEFT" }, "text": "the key-features of OTSL, namely its reduced vocabulary size (12 versus 5 in this case),", "orig": "the key-features of OTSL, namely its reduced vocabulary size (12 versus 5 in this case),", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 10, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 134.8, "r_y0": 189.3, "r_x1": 480.6, "r_y1": 189.3, "r_x2": 480.6, "r_y2": 181.2, "r_x3": 134.8, "r_y3": 181.2, "coord_origin": "TOPLEFT" }, "text": "its reduced sequence length (55 versus 30) and a enhanced internal structure (variable", "orig": "its reduced sequence length (55 versus 30) and a enhanced internal structure (variable", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 11, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 134.8, "r_y0": 200.2, "r_x1": 460.9, "r_y1": 200.2, "r_x2": 460.9, "r_y2": 192.2, "r_x3": 134.8, "r_y3": 192.2, "coord_origin": "TOPLEFT" }, "text": "token sequence length per row in HTML versus a fixed length of rows in OTSL).", "orig": "token sequence length per row in HTML versus a fixed length of rows in OTSL).", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, "text": "Fig. 1. Comparison between HTML and OTSL table structure representation: (A) table-example with complex row and column headers, including a 2D empty span, (B) minimal graphical representation of table structure using rectangular layout, (C) HTML representation, (D) OTSL representation. This example demonstrates many of the key-features of OTSL, namely its reduced vocabulary size (12 versus 5 in this case), its reduced sequence length (55 versus 30) and a enhanced internal structure (variable token sequence length per row in HTML versus a fixed length of rows in OTSL)." }, { "label": "picture", "id": 1, "page_no": 1, "cluster": { "id": 1, "label": "picture", "bbox": { "l": 148.5, "t": 208.4, "r": 464.4, "b": 425.8, "coord_origin": "TOPLEFT" }, "confidence": 0.97, "cells": [ { "index": 12, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 396.4, "r_y0": 289.5, "r_x1": 403.0, "r_y1": 289.5, "r_x2": 403.0, "r_y2": 281.0, "r_x3": 396.4, "r_y3": 281.0, "coord_origin": "TOPLEFT" }, "text": "C", "orig": "C", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 13, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 418.6, "r_y0": 289.4, "r_x1": 425.1, "r_y1": 289.4, "r_x2": 425.1, "r_y2": 280.9, "r_x3": 418.6, "r_y3": 280.9, "coord_origin": "TOPLEFT" }, "text": "C", "orig": "C", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 14, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 395.7, "r_y0": 311.8, "r_x1": 402.3, "r_y1": 311.8, "r_x2": 402.3, "r_y2": 303.2, "r_x3": 395.7, "r_y3": 303.2, "coord_origin": "TOPLEFT" }, "text": "C", "orig": "C", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 15, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 407.5, "r_y0": 311.9, "r_x1": 414.1, "r_y1": 311.9, "r_x2": 414.1, "r_y2": 303.4, "r_x3": 407.5, "r_y3": 303.4, "coord_origin": "TOPLEFT" }, "text": "C", "orig": "C", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 16, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 407.6, "r_y0": 322.9, "r_x1": 414.1, "r_y1": 322.9, "r_x2": 414.1, "r_y2": 314.4, "r_x3": 407.6, "r_y3": 314.4, "coord_origin": "TOPLEFT" }, "text": "C", "orig": "C", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 17, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 418.5, "r_y0": 300.6, "r_x1": 425.1, "r_y1": 300.6, "r_x2": 425.1, "r_y2": 292.1, "r_x3": 418.5, "r_y3": 292.1, "coord_origin": "TOPLEFT" }, "text": "C", "orig": "C", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 18, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 429.6, "r_y0": 300.6, "r_x1": 436.2, "r_y1": 300.6, "r_x2": 436.2, "r_y2": 292.1, "r_x3": 429.6, "r_y3": 292.1, "coord_origin": "TOPLEFT" }, "text": "C", "orig": "C", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 19, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 440.7, "r_y0": 300.5, "r_x1": 447.2, "r_y1": 300.5, "r_x2": 447.2, "r_y2": 292.0, "r_x3": 440.7, "r_y3": 292.0, "coord_origin": "TOPLEFT" }, "text": "C", "orig": "C", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 20, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 418.6, "r_y0": 311.8, "r_x1": 425.2, "r_y1": 311.8, "r_x2": 425.2, "r_y2": 303.3, "r_x3": 418.6, "r_y3": 303.3, "coord_origin": "TOPLEFT" }, "text": "C", "orig": "C", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 21, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 429.7, "r_y0": 311.8, "r_x1": 436.3, "r_y1": 311.8, "r_x2": 436.3, "r_y2": 303.3, "r_x3": 429.7, "r_y3": 303.3, "coord_origin": "TOPLEFT" }, "text": "C", "orig": "C", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 22, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 440.8, "r_y0": 311.7, "r_x1": 447.4, "r_y1": 311.7, "r_x2": 447.4, "r_y2": 303.2, "r_x3": 440.8, "r_y3": 303.2, "coord_origin": "TOPLEFT" }, "text": "C", "orig": "C", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 23, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 418.6, "r_y0": 323.1, "r_x1": 425.2, "r_y1": 323.1, "r_x2": 425.2, "r_y2": 314.6, "r_x3": 418.6, "r_y3": 314.6, "coord_origin": "TOPLEFT" }, "text": "C", "orig": "C", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 24, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 429.7, "r_y0": 323.1, "r_x1": 436.3, "r_y1": 323.1, "r_x2": 436.3, "r_y2": 314.6, "r_x3": 429.7, "r_y3": 314.6, "coord_origin": "TOPLEFT" }, "text": "C", "orig": "C", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 25, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 440.8, "r_y0": 323.0, "r_x1": 447.4, "r_y1": 323.0, "r_x2": 447.4, "r_y2": 314.5, "r_x3": 440.8, "r_y3": 314.5, "coord_origin": "TOPLEFT" }, "text": "C", "orig": "C", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 26, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 407.4, "r_y0": 333.8, "r_x1": 414.0, "r_y1": 333.8, "r_x2": 414.0, "r_y2": 325.3, "r_x3": 407.4, "r_y3": 325.3, "coord_origin": "TOPLEFT" }, "text": "C", "orig": "C", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 27, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 418.5, "r_y0": 334.0, "r_x1": 425.0, "r_y1": 334.0, "r_x2": 425.0, "r_y2": 325.5, "r_x3": 418.5, "r_y3": 325.5, "coord_origin": "TOPLEFT" }, "text": "C", "orig": "C", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 28, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 429.5, "r_y0": 334.0, "r_x1": 436.1, "r_y1": 334.0, "r_x2": 436.1, "r_y2": 325.5, "r_x3": 429.5, "r_y3": 325.5, "coord_origin": "TOPLEFT" }, "text": "C", "orig": "C", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 29, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 440.6, "r_y0": 333.9, "r_x1": 447.2, "r_y1": 333.9, "r_x2": 447.2, "r_y2": 325.4, "r_x3": 440.6, "r_y3": 325.4, "coord_origin": "TOPLEFT" }, "text": "C", "orig": "C", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 30, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 451.9, "r_y0": 288.7, "r_x1": 463.5, "r_y1": 288.7, "r_x2": 463.5, "r_y2": 280.2, "r_x3": 451.9, "r_y3": 280.2, "coord_origin": "TOPLEFT" }, "text": "NL", "orig": "NL", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 31, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 452.2, "r_y0": 300.1, "r_x1": 463.8, "r_y1": 300.1, "r_x2": 463.8, "r_y2": 291.6, "r_x3": 452.2, "r_y3": 291.6, "coord_origin": "TOPLEFT" }, "text": "NL", "orig": "NL", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 32, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 452.2, "r_y0": 311.4, "r_x1": 463.8, "r_y1": 311.4, "r_x2": 463.8, "r_y2": 302.8, "r_x3": 452.2, "r_y3": 302.8, "coord_origin": "TOPLEFT" }, "text": "NL", "orig": "NL", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 33, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 452.1, "r_y0": 322.6, "r_x1": 463.7, "r_y1": 322.6, "r_x2": 463.7, "r_y2": 314.1, "r_x3": 452.1, "r_y3": 314.1, "coord_origin": "TOPLEFT" }, "text": "NL", "orig": "NL", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 34, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 452.3, "r_y0": 334.0, "r_x1": 463.9, "r_y1": 334.0, "r_x2": 463.9, "r_y2": 325.5, "r_x3": 452.3, "r_y3": 325.5, "coord_origin": "TOPLEFT" }, "text": "NL", "orig": "NL", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 35, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 396.1, "r_y0": 323.0, "r_x1": 402.7, "r_y1": 323.0, "r_x2": 402.7, "r_y2": 314.5, "r_x3": 396.1, "r_y3": 314.5, "coord_origin": "TOPLEFT" }, "text": "U", "orig": "U", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 36, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 396.0, "r_y0": 333.9, "r_x1": 402.6, "r_y1": 333.9, "r_x2": 402.6, "r_y2": 325.4, "r_x3": 396.0, "r_y3": 325.4, "coord_origin": "TOPLEFT" }, "text": "U", "orig": "U", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 37, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 396.3, "r_y0": 300.8, "r_x1": 402.8, "r_y1": 300.8, "r_x2": 402.8, "r_y2": 292.3, "r_x3": 396.3, "r_y3": 292.3, "coord_origin": "TOPLEFT" }, "text": "U", "orig": "U", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 38, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 408.5, "r_y0": 289.5, "r_x1": 413.6, "r_y1": 289.5, "r_x2": 413.6, "r_y2": 281.0, "r_x3": 408.5, "r_y3": 281.0, "coord_origin": "TOPLEFT" }, "text": "L", "orig": "L", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 39, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 430.6, "r_y0": 289.0, "r_x1": 435.6, "r_y1": 289.0, "r_x2": 435.6, "r_y2": 280.5, "r_x3": 430.6, "r_y3": 280.5, "coord_origin": "TOPLEFT" }, "text": "L", "orig": "L", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 40, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 441.1, "r_y0": 288.9, "r_x1": 446.1, "r_y1": 288.9, "r_x2": 446.1, "r_y2": 280.4, "r_x3": 441.1, "r_y3": 280.4, "coord_origin": "TOPLEFT" }, "text": "L", "orig": "L", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 41, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 408.0, "r_y0": 300.7, "r_x1": 414.0, "r_y1": 300.7, "r_x2": 414.0, "r_y2": 292.1, "r_x3": 408.0, "r_y3": 292.1, "coord_origin": "TOPLEFT" }, "text": "X", "orig": "X", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 42, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 441.3, "r_y0": 419.7, "r_x1": 452.9, "r_y1": 419.7, "r_x2": 452.9, "r_y2": 411.2, "r_x3": 441.3, "r_y3": 411.2, "coord_origin": "TOPLEFT" }, "text": "NL", "orig": "NL", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 43, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 393.8, "r_y0": 406.9, "r_x1": 432.5, "r_y1": 406.9, "r_x2": 432.5, "r_y2": 399.8, "r_x3": 393.8, "r_y3": 399.8, "coord_origin": "TOPLEFT" }, "text": "vocabulary:", "orig": "vocabulary:", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 44, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 434.6, "r_y0": 406.9, "r_x1": 438.8, "r_y1": 406.9, "r_x2": 438.8, "r_y2": 399.8, "r_x3": 434.6, "r_y3": 399.8, "coord_origin": "TOPLEFT" }, "text": "5", "orig": "5", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 45, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 440.9, "r_y0": 406.9, "r_x1": 463.2, "r_y1": 406.9, "r_x2": 463.2, "r_y2": 399.8, "r_x3": 440.9, "r_y3": 399.8, "coord_origin": "TOPLEFT" }, "text": "tokens", "orig": "tokens", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 46, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 384.1, "r_y0": 265.7, "r_x1": 414.0, "r_y1": 265.7, "r_x2": 414.0, "r_y2": 258.5, "r_x3": 384.1, "r_y3": 258.5, "coord_origin": "TOPLEFT" }, "text": "D OTSL", "orig": "D OTSL", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 47, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 393.8, "r_y0": 273.8, "r_x1": 451.5, "r_y1": 273.8, "r_x2": 451.5, "r_y2": 266.7, "r_x3": 393.8, "r_y3": 266.7, "coord_origin": "TOPLEFT" }, "text": "sequence length:", "orig": "sequence length:", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 48, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 453.6, "r_y0": 273.8, "r_x1": 462.0, "r_y1": 273.8, "r_x2": 462.0, "r_y2": 266.7, "r_x3": 453.6, "r_y3": 266.7, "coord_origin": "TOPLEFT" }, "text": "30", "orig": "30", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 49, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 151.8, "r_y0": 406.9, "r_x1": 233.9, "r_y1": 406.9, "r_x2": 233.9, "r_y2": 399.8, "r_x3": 151.8, "r_y3": 399.8, "coord_origin": "TOPLEFT" }, "text": "vocabulary for this table:", "orig": "vocabulary for this table:", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 50, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 236.0, "r_y0": 406.9, "r_x1": 244.4, "r_y1": 406.9, "r_x2": 244.4, "r_y2": 399.8, "r_x3": 236.0, "r_y3": 399.8, "coord_origin": "TOPLEFT" }, "text": "12", "orig": "12", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 51, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 246.5, "r_y0": 406.9, "r_x1": 268.8, "r_y1": 406.9, "r_x2": 268.8, "r_y2": 399.8, "r_x3": 246.5, "r_y3": 399.8, "coord_origin": "TOPLEFT" }, "text": "tokens", "orig": "tokens", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 52, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 154.3, "r_y0": 220.7, "r_x1": 159.8, "r_y1": 220.7, "r_x2": 159.8, "r_y2": 213.6, "r_x3": 154.3, "r_y3": 213.6, "coord_origin": "TOPLEFT" }, "text": "A", "orig": "A", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 53, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 321.1, "r_y0": 220.7, "r_x1": 326.5, "r_y1": 220.7, "r_x2": 326.5, "r_y2": 213.6, "r_x3": 321.1, "r_y3": 213.6, "coord_origin": "TOPLEFT" }, "text": "B", "orig": "B", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 54, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 153.1, "r_y0": 286.7, "r_x1": 175.8, "r_y1": 286.7, "r_x2": 175.8, "r_y2": 280.3, "r_x3": 153.1, "r_y3": 280.3, "coord_origin": "TOPLEFT" }, "text": "", "orig": "
", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 55, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 160.7, "r_y0": 293.5, "r_x1": 172.8, "r_y1": 293.5, "r_x2": 172.8, "r_y2": 287.1, "r_x3": 160.7, "r_y3": 287.1, "coord_origin": "TOPLEFT" }, "text": "", "orig": "", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 56, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 168.2, "r_y0": 300.3, "r_x1": 177.9, "r_y1": 300.3, "r_x2": 177.9, "r_y2": 293.9, "r_x3": 168.2, "r_y3": 293.9, "coord_origin": "TOPLEFT" }, "text": "", "orig": ">", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 60, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 263.4, "r_y0": 300.3, "r_x1": 278.9, "r_y1": 300.3, "r_x2": 278.9, "r_y2": 293.9, "r_x3": 263.4, "r_y3": 293.9, "coord_origin": "TOPLEFT" }, "text": "", "orig": "", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 61, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 280.8, "r_y0": 300.3, "r_x1": 290.5, "r_y1": 300.3, "r_x2": 290.5, "r_y2": 293.9, "r_x3": 280.8, "r_y3": 293.9, "coord_origin": "TOPLEFT" }, "text": "", "orig": ">", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 64, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 335.9, "r_y0": 300.3, "r_x1": 351.5, "r_y1": 300.3, "r_x2": 351.5, "r_y2": 293.9, "r_x3": 335.9, "r_y3": 293.9, "coord_origin": "TOPLEFT" }, "text": "", "orig": "", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 65, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 160.7, "r_y0": 307.1, "r_x1": 174.7, "r_y1": 307.1, "r_x2": 174.7, "r_y2": 300.8, "r_x3": 160.7, "r_y3": 300.8, "coord_origin": "TOPLEFT" }, "text": "", "orig": "", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 66, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 160.7, "r_y0": 314.0, "r_x1": 172.8, "r_y1": 314.0, "r_x2": 172.8, "r_y2": 307.6, "r_x3": 160.7, "r_y3": 307.6, "coord_origin": "TOPLEFT" }, "text": "", "orig": "", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 67, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 168.2, "r_y0": 320.8, "r_x1": 181.9, "r_y1": 320.8, "r_x2": 181.9, "r_y2": 314.4, "r_x3": 168.2, "r_y3": 314.4, "coord_origin": "TOPLEFT" }, "text": "", "orig": "", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 69, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 201.2, "r_y0": 320.8, "r_x1": 214.9, "r_y1": 320.8, "r_x2": 214.9, "r_y2": 314.4, "r_x3": 201.2, "r_y3": 314.4, "coord_origin": "TOPLEFT" }, "text": "", "orig": "", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 71, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 234.2, "r_y0": 320.8, "r_x1": 247.8, "r_y1": 320.8, "r_x2": 247.8, "r_y2": 314.4, "r_x3": 234.2, "r_y3": 314.4, "coord_origin": "TOPLEFT" }, "text": "", "orig": "", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 73, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 160.7, "r_y0": 327.6, "r_x1": 174.7, "r_y1": 327.6, "r_x2": 174.7, "r_y2": 321.2, "r_x3": 160.7, "r_y3": 321.2, "coord_origin": "TOPLEFT" }, "text": "", "orig": "", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 74, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 160.7, "r_y0": 334.4, "r_x1": 172.8, "r_y1": 334.4, "r_x2": 172.8, "r_y2": 328.0, "r_x3": 160.7, "r_y3": 328.0, "coord_origin": "TOPLEFT" }, "text": "", "orig": "", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 75, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 168.2, "r_y0": 341.2, "r_x1": 373.1, "r_y1": 341.2, "r_x2": 373.1, "r_y2": 334.8, "r_x3": 168.2, "r_y3": 334.8, "coord_origin": "TOPLEFT" }, "text": "", "orig": "", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 76, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 160.7, "r_y0": 348.0, "r_x1": 174.7, "r_y1": 348.0, "r_x2": 174.7, "r_y2": 341.7, "r_x3": 160.7, "r_y3": 341.7, "coord_origin": "TOPLEFT" }, "text": "", "orig": "", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 77, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 160.7, "r_y0": 354.9, "r_x1": 172.8, "r_y1": 354.9, "r_x2": 172.8, "r_y2": 348.5, "r_x3": 160.7, "r_y3": 348.5, "coord_origin": "TOPLEFT" }, "text": "", "orig": "", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 78, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 168.2, "r_y0": 361.7, "r_x1": 181.9, "r_y1": 361.7, "r_x2": 181.9, "r_y2": 355.3, "r_x3": 168.2, "r_y3": 355.3, "coord_origin": "TOPLEFT" }, "text": "", "orig": "", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 80, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 201.2, "r_y0": 361.7, "r_x1": 214.9, "r_y1": 361.7, "r_x2": 214.9, "r_y2": 355.3, "r_x3": 201.2, "r_y3": 355.3, "coord_origin": "TOPLEFT" }, "text": "", "orig": "", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 82, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 234.2, "r_y0": 361.7, "r_x1": 247.8, "r_y1": 361.7, "r_x2": 247.8, "r_y2": 355.3, "r_x3": 234.2, "r_y3": 355.3, "coord_origin": "TOPLEFT" }, "text": "", "orig": "", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 84, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 267.2, "r_y0": 361.7, "r_x1": 280.8, "r_y1": 361.7, "r_x2": 280.8, "r_y2": 355.3, "r_x3": 267.2, "r_y3": 355.3, "coord_origin": "TOPLEFT" }, "text": "", "orig": "", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 86, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 160.7, "r_y0": 368.5, "r_x1": 174.7, "r_y1": 368.5, "r_x2": 174.7, "r_y2": 362.1, "r_x3": 160.7, "r_y3": 362.1, "coord_origin": "TOPLEFT" }, "text": "", "orig": "", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 87, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 160.7, "r_y0": 375.3, "r_x1": 172.8, "r_y1": 375.3, "r_x2": 172.8, "r_y2": 368.9, "r_x3": 160.7, "r_y3": 368.9, "coord_origin": "TOPLEFT" }, "text": "", "orig": "", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 88, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 168.2, "r_y0": 382.1, "r_x1": 181.9, "r_y1": 382.1, "r_x2": 181.9, "r_y2": 375.7, "r_x3": 168.2, "r_y3": 375.7, "coord_origin": "TOPLEFT" }, "text": "", "orig": "", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 90, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 201.2, "r_y0": 382.1, "r_x1": 214.9, "r_y1": 382.1, "r_x2": 214.9, "r_y2": 375.7, "r_x3": 201.2, "r_y3": 375.7, "coord_origin": "TOPLEFT" }, "text": "", "orig": "", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 92, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 234.2, "r_y0": 382.1, "r_x1": 247.8, "r_y1": 382.1, "r_x2": 247.8, "r_y2": 375.7, "r_x3": 234.2, "r_y3": 375.7, "coord_origin": "TOPLEFT" }, "text": "", "orig": "", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 94, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 267.2, "r_y0": 382.1, "r_x1": 280.8, "r_y1": 382.1, "r_x2": 280.8, "r_y2": 375.7, "r_x3": 267.2, "r_y3": 375.7, "coord_origin": "TOPLEFT" }, "text": "", "orig": "", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 96, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 160.7, "r_y0": 388.9, "r_x1": 174.7, "r_y1": 388.9, "r_x2": 174.7, "r_y2": 382.6, "r_x3": 160.7, "r_y3": 382.6, "coord_origin": "TOPLEFT" }, "text": "", "orig": "", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 97, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 153.1, "r_y0": 395.8, "r_x1": 177.7, "r_y1": 395.8, "r_x2": 177.7, "r_y2": 389.4, "r_x3": 153.1, "r_y3": 389.4, "coord_origin": "TOPLEFT" }, "text": "
", "orig": "", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 68, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 183.8, "r_y0": 320.8, "r_x1": 199.3, "r_y1": 320.8, "r_x2": 199.3, "r_y2": 314.4, "r_x3": 183.8, "r_y3": 314.4, "coord_origin": "TOPLEFT" }, "text": "", "orig": "", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 70, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 216.8, "r_y0": 320.8, "r_x1": 232.3, "r_y1": 320.8, "r_x2": 232.3, "r_y2": 314.4, "r_x3": 216.8, "r_y3": 314.4, "coord_origin": "TOPLEFT" }, "text": "", "orig": "", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 72, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 249.7, "r_y0": 320.8, "r_x1": 265.3, "r_y1": 320.8, "r_x2": 265.3, "r_y2": 314.4, "r_x3": 249.7, "r_y3": 314.4, "coord_origin": "TOPLEFT" }, "text": "
", "orig": "", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 79, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 183.8, "r_y0": 361.7, "r_x1": 199.3, "r_y1": 361.7, "r_x2": 199.3, "r_y2": 355.3, "r_x3": 183.8, "r_y3": 355.3, "coord_origin": "TOPLEFT" }, "text": "", "orig": "", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 81, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 216.8, "r_y0": 361.7, "r_x1": 232.3, "r_y1": 361.7, "r_x2": 232.3, "r_y2": 355.3, "r_x3": 216.8, "r_y3": 355.3, "coord_origin": "TOPLEFT" }, "text": "", "orig": "", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 83, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 249.7, "r_y0": 361.7, "r_x1": 265.3, "r_y1": 361.7, "r_x2": 265.3, "r_y2": 355.3, "r_x3": 249.7, "r_y3": 355.3, "coord_origin": "TOPLEFT" }, "text": "", "orig": "", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 85, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 282.7, "r_y0": 361.7, "r_x1": 298.2, "r_y1": 361.7, "r_x2": 298.2, "r_y2": 355.3, "r_x3": 282.7, "r_y3": 355.3, "coord_origin": "TOPLEFT" }, "text": "
", "orig": "", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 89, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 183.8, "r_y0": 382.1, "r_x1": 199.3, "r_y1": 382.1, "r_x2": 199.3, "r_y2": 375.7, "r_x3": 183.8, "r_y3": 375.7, "coord_origin": "TOPLEFT" }, "text": "", "orig": "", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 91, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 216.8, "r_y0": 382.1, "r_x1": 232.3, "r_y1": 382.1, "r_x2": 232.3, "r_y2": 375.7, "r_x3": 216.8, "r_y3": 375.7, "coord_origin": "TOPLEFT" }, "text": "", "orig": "", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 93, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 249.7, "r_y0": 382.1, "r_x1": 265.3, "r_y1": 382.1, "r_x2": 265.3, "r_y2": 375.7, "r_x3": 249.7, "r_y3": 375.7, "coord_origin": "TOPLEFT" }, "text": "", "orig": "", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 95, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 282.7, "r_y0": 382.1, "r_x1": 298.2, "r_y1": 382.1, "r_x2": 298.2, "r_y2": 375.7, "r_x3": 282.7, "r_y3": 375.7, "coord_origin": "TOPLEFT" }, "text": "
", "orig": "", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 98, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 395.1, "r_y0": 419.9, "r_x1": 401.6, "r_y1": 419.9, "r_x2": 401.6, "r_y2": 411.3, "r_x3": 395.1, "r_y3": 411.3, "coord_origin": "TOPLEFT" }, "text": "C", "orig": "C", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 99, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 407.4, "r_y0": 419.9, "r_x1": 412.5, "r_y1": 419.9, "r_x2": 412.5, "r_y2": 411.3, "r_x3": 407.4, "r_y3": 411.3, "coord_origin": "TOPLEFT" }, "text": "L", "orig": "L", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 100, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 418.7, "r_y0": 419.9, "r_x1": 425.3, "r_y1": 419.9, "r_x2": 425.3, "r_y2": 411.3, "r_x3": 418.7, "r_y3": 411.3, "coord_origin": "TOPLEFT" }, "text": "U", "orig": "U", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 101, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 430.5, "r_y0": 419.9, "r_x1": 436.6, "r_y1": 419.9, "r_x2": 436.6, "r_y2": 411.3, "r_x3": 430.5, "r_y3": 411.3, "coord_origin": "TOPLEFT" }, "text": "X", "orig": "X", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 102, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 152.4, "r_y0": 416.2, "r_x1": 175.1, "r_y1": 416.2, "r_x2": 175.1, "r_y2": 409.8, "r_x3": 152.4, "r_y3": 409.8, "coord_origin": "TOPLEFT" }, "text": "", "orig": "
", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 103, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 178.9, "r_y0": 416.2, "r_x1": 191.0, "r_y1": 416.2, "r_x2": 191.0, "r_y2": 409.8, "r_x3": 178.9, "r_y3": 409.8, "coord_origin": "TOPLEFT" }, "text": "", "orig": "", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 104, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 194.8, "r_y0": 416.2, "r_x1": 208.8, "r_y1": 416.2, "r_x2": 208.8, "r_y2": 409.8, "r_x3": 194.8, "r_y3": 409.8, "coord_origin": "TOPLEFT" }, "text": "", "orig": "", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 105, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 212.6, "r_y0": 416.2, "r_x1": 226.3, "r_y1": 416.2, "r_x2": 226.3, "r_y2": 409.8, "r_x3": 212.6, "r_y3": 409.8, "coord_origin": "TOPLEFT" }, "text": "", "orig": "", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 107, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 249.4, "r_y0": 416.2, "r_x1": 259.0, "r_y1": 416.2, "r_x2": 259.0, "r_y2": 409.8, "r_x3": 249.4, "r_y3": 409.8, "coord_origin": "TOPLEFT" }, "text": "", "orig": ">", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 113, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 244.5, "r_y0": 424.5, "r_x1": 269.1, "r_y1": 424.5, "r_x2": 269.1, "r_y2": 418.1, "r_x3": 244.5, "r_y3": 418.1, "coord_origin": "TOPLEFT" }, "text": "
", "orig": "", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 106, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 230.0, "r_y0": 416.2, "r_x1": 245.6, "r_y1": 416.2, "r_x2": 245.6, "r_y2": 409.8, "r_x3": 230.0, "r_y3": 409.8, "coord_origin": "TOPLEFT" }, "text": "
", "orig": "", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 114, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 154.5, "r_y0": 265.7, "r_x1": 159.6, "r_y1": 265.7, "r_x2": 159.6, "r_y2": 258.6, "r_x3": 154.5, "r_y3": 258.6, "coord_origin": "TOPLEFT" }, "text": "C", "orig": "C", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 115, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 164.7, "r_y0": 265.7, "r_x1": 185.2, "r_y1": 265.7, "r_x2": 185.2, "r_y2": 258.6, "r_x3": 164.7, "r_y3": 258.6, "coord_origin": "TOPLEFT" }, "text": "HTML", "orig": "HTML", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 116, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 164.4, "r_y0": 273.6, "r_x1": 222.1, "r_y1": 273.6, "r_x2": 222.1, "r_y2": 266.5, "r_x3": 164.4, "r_y3": 266.5, "coord_origin": "TOPLEFT" }, "text": "sequence length:", "orig": "sequence length:", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 117, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 224.2, "r_y0": 273.6, "r_x1": 232.6, "r_y1": 273.6, "r_x2": 232.6, "r_y2": 266.5, "r_x3": 224.2, "r_y3": 266.5, "coord_origin": "TOPLEFT" }, "text": "55", "orig": "55", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [ { "id": 11, "label": "text", "bbox": { "l": 396.4, "t": 281.0, "r": 403.0, "b": 289.5, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 12, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 396.4, "r_y0": 289.5, "r_x1": 403.0, "r_y1": 289.5, "r_x2": 403.0, "r_y2": 281.0, "r_x3": 396.4, "r_y3": 281.0, "coord_origin": "TOPLEFT" }, "text": "C", "orig": "C", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 12, "label": "text", "bbox": { "l": 418.6, "t": 280.9, "r": 425.1, "b": 289.4, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 13, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 418.6, "r_y0": 289.4, "r_x1": 425.1, "r_y1": 289.4, "r_x2": 425.1, "r_y2": 280.9, "r_x3": 418.6, "r_y3": 280.9, "coord_origin": "TOPLEFT" }, "text": "C", "orig": "C", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 13, "label": "text", "bbox": { "l": 395.7, "t": 303.2, "r": 402.3, "b": 311.8, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 14, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 395.7, "r_y0": 311.8, "r_x1": 402.3, "r_y1": 311.8, "r_x2": 402.3, "r_y2": 303.2, "r_x3": 395.7, "r_y3": 303.2, "coord_origin": "TOPLEFT" }, "text": "C", "orig": "C", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 14, "label": "text", "bbox": { "l": 407.5, "t": 303.4, "r": 414.1, "b": 311.9, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 15, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 407.5, "r_y0": 311.9, "r_x1": 414.1, "r_y1": 311.9, "r_x2": 414.1, "r_y2": 303.4, "r_x3": 407.5, "r_y3": 303.4, "coord_origin": "TOPLEFT" }, "text": "C", "orig": "C", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 15, "label": "text", "bbox": { "l": 407.6, "t": 314.4, "r": 414.1, "b": 322.9, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 16, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 407.6, "r_y0": 322.9, "r_x1": 414.1, "r_y1": 322.9, "r_x2": 414.1, "r_y2": 314.4, "r_x3": 407.6, "r_y3": 314.4, "coord_origin": "TOPLEFT" }, "text": "C", "orig": "C", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 16, "label": "text", "bbox": { "l": 418.5, "t": 292.1, "r": 425.1, "b": 300.6, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 17, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 418.5, "r_y0": 300.6, "r_x1": 425.1, "r_y1": 300.6, "r_x2": 425.1, "r_y2": 292.1, "r_x3": 418.5, "r_y3": 292.1, "coord_origin": "TOPLEFT" }, "text": "C", "orig": "C", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 17, "label": "text", "bbox": { "l": 429.6, "t": 292.1, "r": 436.2, "b": 300.6, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 18, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 429.6, "r_y0": 300.6, "r_x1": 436.2, "r_y1": 300.6, "r_x2": 436.2, "r_y2": 292.1, "r_x3": 429.6, "r_y3": 292.1, "coord_origin": "TOPLEFT" }, "text": "C", "orig": "C", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 18, "label": "text", "bbox": { "l": 440.7, "t": 292.0, "r": 447.2, "b": 300.5, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 19, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 440.7, "r_y0": 300.5, "r_x1": 447.2, "r_y1": 300.5, "r_x2": 447.2, "r_y2": 292.0, "r_x3": 440.7, "r_y3": 292.0, "coord_origin": "TOPLEFT" }, "text": "C", "orig": "C", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 19, "label": "text", "bbox": { "l": 418.6, "t": 303.3, "r": 425.2, "b": 311.8, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 20, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 418.6, "r_y0": 311.8, "r_x1": 425.2, "r_y1": 311.8, "r_x2": 425.2, "r_y2": 303.3, "r_x3": 418.6, "r_y3": 303.3, "coord_origin": "TOPLEFT" }, "text": "C", "orig": "C", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 20, "label": "text", "bbox": { "l": 429.7, "t": 303.3, "r": 436.3, "b": 311.8, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 21, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 429.7, "r_y0": 311.8, "r_x1": 436.3, "r_y1": 311.8, "r_x2": 436.3, "r_y2": 303.3, "r_x3": 429.7, "r_y3": 303.3, "coord_origin": "TOPLEFT" }, "text": "C", "orig": "C", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 21, "label": "text", "bbox": { "l": 440.8, "t": 303.2, "r": 447.4, "b": 311.7, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 22, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 440.8, "r_y0": 311.7, "r_x1": 447.4, "r_y1": 311.7, "r_x2": 447.4, "r_y2": 303.2, "r_x3": 440.8, "r_y3": 303.2, "coord_origin": "TOPLEFT" }, "text": "C", "orig": "C", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 22, "label": "text", "bbox": { "l": 418.6, "t": 314.6, "r": 425.2, "b": 323.1, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 23, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 418.6, "r_y0": 323.1, "r_x1": 425.2, "r_y1": 323.1, "r_x2": 425.2, "r_y2": 314.6, "r_x3": 418.6, "r_y3": 314.6, "coord_origin": "TOPLEFT" }, "text": "C", "orig": "C", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 23, "label": "text", "bbox": { "l": 429.7, "t": 314.6, "r": 436.3, "b": 323.1, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 24, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 429.7, "r_y0": 323.1, "r_x1": 436.3, "r_y1": 323.1, "r_x2": 436.3, "r_y2": 314.6, "r_x3": 429.7, "r_y3": 314.6, "coord_origin": "TOPLEFT" }, "text": "C", "orig": "C", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 24, "label": "text", "bbox": { "l": 440.8, "t": 314.5, "r": 447.4, "b": 323.0, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 25, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 440.8, "r_y0": 323.0, "r_x1": 447.4, "r_y1": 323.0, "r_x2": 447.4, "r_y2": 314.5, "r_x3": 440.8, "r_y3": 314.5, "coord_origin": "TOPLEFT" }, "text": "C", "orig": "C", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 25, "label": "text", "bbox": { "l": 407.4, "t": 325.3, "r": 414.0, "b": 333.8, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 26, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 407.4, "r_y0": 333.8, "r_x1": 414.0, "r_y1": 333.8, "r_x2": 414.0, "r_y2": 325.3, "r_x3": 407.4, "r_y3": 325.3, "coord_origin": "TOPLEFT" }, "text": "C", "orig": "C", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 26, "label": "text", "bbox": { "l": 418.5, "t": 325.5, "r": 425.0, "b": 334.0, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 27, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 418.5, "r_y0": 334.0, "r_x1": 425.0, "r_y1": 334.0, "r_x2": 425.0, "r_y2": 325.5, "r_x3": 418.5, "r_y3": 325.5, "coord_origin": "TOPLEFT" }, "text": "C", "orig": "C", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 27, "label": "text", "bbox": { "l": 429.5, "t": 325.5, "r": 436.1, "b": 334.0, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 28, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 429.5, "r_y0": 334.0, "r_x1": 436.1, "r_y1": 334.0, "r_x2": 436.1, "r_y2": 325.5, "r_x3": 429.5, "r_y3": 325.5, "coord_origin": "TOPLEFT" }, "text": "C", "orig": "C", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 28, "label": "text", "bbox": { "l": 440.6, "t": 325.4, "r": 447.2, "b": 333.9, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 29, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 440.6, "r_y0": 333.9, "r_x1": 447.2, "r_y1": 333.9, "r_x2": 447.2, "r_y2": 325.4, "r_x3": 440.6, "r_y3": 325.4, "coord_origin": "TOPLEFT" }, "text": "C", "orig": "C", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 29, "label": "text", "bbox": { "l": 451.9, "t": 280.2, "r": 463.5, "b": 288.7, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 30, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 451.9, "r_y0": 288.7, "r_x1": 463.5, "r_y1": 288.7, "r_x2": 463.5, "r_y2": 280.2, "r_x3": 451.9, "r_y3": 280.2, "coord_origin": "TOPLEFT" }, "text": "NL", "orig": "NL", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 30, "label": "text", "bbox": { "l": 452.2, "t": 291.6, "r": 463.8, "b": 300.1, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 31, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 452.2, "r_y0": 300.1, "r_x1": 463.8, "r_y1": 300.1, "r_x2": 463.8, "r_y2": 291.6, "r_x3": 452.2, "r_y3": 291.6, "coord_origin": "TOPLEFT" }, "text": "NL", "orig": "NL", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 31, "label": "text", "bbox": { "l": 452.2, "t": 302.8, "r": 463.8, "b": 311.4, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 32, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 452.2, "r_y0": 311.4, "r_x1": 463.8, "r_y1": 311.4, "r_x2": 463.8, "r_y2": 302.8, "r_x3": 452.2, "r_y3": 302.8, "coord_origin": "TOPLEFT" }, "text": "NL", "orig": "NL", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 32, "label": "text", "bbox": { "l": 452.1, "t": 314.1, "r": 463.7, "b": 322.6, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 33, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 452.1, "r_y0": 322.6, "r_x1": 463.7, "r_y1": 322.6, "r_x2": 463.7, "r_y2": 314.1, "r_x3": 452.1, "r_y3": 314.1, "coord_origin": "TOPLEFT" }, "text": "NL", "orig": "NL", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 33, "label": "text", "bbox": { "l": 452.3, "t": 325.5, "r": 463.9, "b": 334.0, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 34, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 452.3, "r_y0": 334.0, "r_x1": 463.9, "r_y1": 334.0, "r_x2": 463.9, "r_y2": 325.5, "r_x3": 452.3, "r_y3": 325.5, "coord_origin": "TOPLEFT" }, "text": "NL", "orig": "NL", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 34, "label": "text", "bbox": { "l": 396.1, "t": 314.5, "r": 402.7, "b": 323.0, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 35, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 396.1, "r_y0": 323.0, "r_x1": 402.7, "r_y1": 323.0, "r_x2": 402.7, "r_y2": 314.5, "r_x3": 396.1, "r_y3": 314.5, "coord_origin": "TOPLEFT" }, "text": "U", "orig": "U", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 35, "label": "text", "bbox": { "l": 396.0, "t": 325.4, "r": 402.6, "b": 333.9, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 36, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 396.0, "r_y0": 333.9, "r_x1": 402.6, "r_y1": 333.9, "r_x2": 402.6, "r_y2": 325.4, "r_x3": 396.0, "r_y3": 325.4, "coord_origin": "TOPLEFT" }, "text": "U", "orig": "U", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 36, "label": "text", "bbox": { "l": 396.3, "t": 292.3, "r": 402.8, "b": 300.8, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 37, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 396.3, "r_y0": 300.8, "r_x1": 402.8, "r_y1": 300.8, "r_x2": 402.8, "r_y2": 292.3, "r_x3": 396.3, "r_y3": 292.3, "coord_origin": "TOPLEFT" }, "text": "U", "orig": "U", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 37, "label": "text", "bbox": { "l": 408.5, "t": 281.0, "r": 413.6, "b": 289.5, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 38, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 408.5, "r_y0": 289.5, "r_x1": 413.6, "r_y1": 289.5, "r_x2": 413.6, "r_y2": 281.0, "r_x3": 408.5, "r_y3": 281.0, "coord_origin": "TOPLEFT" }, "text": "L", "orig": "L", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 38, "label": "text", "bbox": { "l": 430.6, "t": 280.5, "r": 435.6, "b": 289.0, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 39, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 430.6, "r_y0": 289.0, "r_x1": 435.6, "r_y1": 289.0, "r_x2": 435.6, "r_y2": 280.5, "r_x3": 430.6, "r_y3": 280.5, "coord_origin": "TOPLEFT" }, "text": "L", "orig": "L", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 39, "label": "text", "bbox": { "l": 441.1, "t": 280.4, "r": 446.1, "b": 288.9, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 40, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 441.1, "r_y0": 288.9, "r_x1": 446.1, "r_y1": 288.9, "r_x2": 446.1, "r_y2": 280.4, "r_x3": 441.1, "r_y3": 280.4, "coord_origin": "TOPLEFT" }, "text": "L", "orig": "L", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 40, "label": "text", "bbox": { "l": 408.0, "t": 292.1, "r": 414.0, "b": 300.7, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 41, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 408.0, "r_y0": 300.7, "r_x1": 414.0, "r_y1": 300.7, "r_x2": 414.0, "r_y2": 292.1, "r_x3": 408.0, "r_y3": 292.1, "coord_origin": "TOPLEFT" }, "text": "X", "orig": "X", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 41, "label": "text", "bbox": { "l": 441.3, "t": 411.2, "r": 452.9, "b": 419.7, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 42, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 441.3, "r_y0": 419.7, "r_x1": 452.9, "r_y1": 419.7, "r_x2": 452.9, "r_y2": 411.2, "r_x3": 441.3, "r_y3": 411.2, "coord_origin": "TOPLEFT" }, "text": "NL", "orig": "NL", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 42, "label": "text", "bbox": { "l": 393.8, "t": 399.8, "r": 432.5, "b": 406.9, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 43, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 393.8, "r_y0": 406.9, "r_x1": 432.5, "r_y1": 406.9, "r_x2": 432.5, "r_y2": 399.8, "r_x3": 393.8, "r_y3": 399.8, "coord_origin": "TOPLEFT" }, "text": "vocabulary:", "orig": "vocabulary:", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 43, "label": "text", "bbox": { "l": 434.6, "t": 399.8, "r": 438.8, "b": 406.9, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 44, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 434.6, "r_y0": 406.9, "r_x1": 438.8, "r_y1": 406.9, "r_x2": 438.8, "r_y2": 399.8, "r_x3": 434.6, "r_y3": 399.8, "coord_origin": "TOPLEFT" }, "text": "5", "orig": "5", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 44, "label": "text", "bbox": { "l": 440.9, "t": 399.8, "r": 463.2, "b": 406.9, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 45, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 440.9, "r_y0": 406.9, "r_x1": 463.2, "r_y1": 406.9, "r_x2": 463.2, "r_y2": 399.8, "r_x3": 440.9, "r_y3": 399.8, "coord_origin": "TOPLEFT" }, "text": "tokens", "orig": "tokens", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 45, "label": "text", "bbox": { "l": 384.1, "t": 258.5, "r": 414.0, "b": 265.7, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 46, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 384.1, "r_y0": 265.7, "r_x1": 414.0, "r_y1": 265.7, "r_x2": 414.0, "r_y2": 258.5, "r_x3": 384.1, "r_y3": 258.5, "coord_origin": "TOPLEFT" }, "text": "D OTSL", "orig": "D OTSL", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 46, "label": "text", "bbox": { "l": 393.8, "t": 266.7, "r": 451.5, "b": 273.8, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 47, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 393.8, "r_y0": 273.8, "r_x1": 451.5, "r_y1": 273.8, "r_x2": 451.5, "r_y2": 266.7, "r_x3": 393.8, "r_y3": 266.7, "coord_origin": "TOPLEFT" }, "text": "sequence length:", "orig": "sequence length:", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 47, "label": "text", "bbox": { "l": 453.6, "t": 266.7, "r": 462.0, "b": 273.8, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 48, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 453.6, "r_y0": 273.8, "r_x1": 462.0, "r_y1": 273.8, "r_x2": 462.0, "r_y2": 266.7, "r_x3": 453.6, "r_y3": 266.7, "coord_origin": "TOPLEFT" }, "text": "30", "orig": "30", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 48, "label": "text", "bbox": { "l": 151.8, "t": 399.8, "r": 233.9, "b": 406.9, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 49, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 151.8, "r_y0": 406.9, "r_x1": 233.9, "r_y1": 406.9, "r_x2": 233.9, "r_y2": 399.8, "r_x3": 151.8, "r_y3": 399.8, "coord_origin": "TOPLEFT" }, "text": "vocabulary for this table:", "orig": "vocabulary for this table:", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 49, "label": "text", "bbox": { "l": 236.0, "t": 399.8, "r": 244.4, "b": 406.9, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 50, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 236.0, "r_y0": 406.9, "r_x1": 244.4, "r_y1": 406.9, "r_x2": 244.4, "r_y2": 399.8, "r_x3": 236.0, "r_y3": 399.8, "coord_origin": "TOPLEFT" }, "text": "12", "orig": "12", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 50, "label": "text", "bbox": { "l": 246.5, "t": 399.8, "r": 268.8, "b": 406.9, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 51, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 246.5, "r_y0": 406.9, "r_x1": 268.8, "r_y1": 406.9, "r_x2": 268.8, "r_y2": 399.8, "r_x3": 246.5, "r_y3": 399.8, "coord_origin": "TOPLEFT" }, "text": "tokens", "orig": "tokens", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 51, "label": "text", "bbox": { "l": 154.3, "t": 213.6, "r": 159.8, "b": 220.7, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 52, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 154.3, "r_y0": 220.7, "r_x1": 159.8, "r_y1": 220.7, "r_x2": 159.8, "r_y2": 213.6, "r_x3": 154.3, "r_y3": 213.6, "coord_origin": "TOPLEFT" }, "text": "A", "orig": "A", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 52, "label": "text", "bbox": { "l": 321.1, "t": 213.6, "r": 326.5, "b": 220.7, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 53, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 321.1, "r_y0": 220.7, "r_x1": 326.5, "r_y1": 220.7, "r_x2": 326.5, "r_y2": 213.6, "r_x3": 321.1, "r_y3": 213.6, "coord_origin": "TOPLEFT" }, "text": "B", "orig": "B", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 53, "label": "text", "bbox": { "l": 153.1, "t": 280.3, "r": 175.8, "b": 286.7, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 54, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 153.1, "r_y0": 286.7, "r_x1": 175.8, "r_y1": 286.7, "r_x2": 175.8, "r_y2": 280.3, "r_x3": 153.1, "r_y3": 280.3, "coord_origin": "TOPLEFT" }, "text": "", "orig": "
", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 54, "label": "text", "bbox": { "l": 160.7, "t": 287.1, "r": 172.8, "b": 293.5, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 55, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 160.7, "r_y0": 293.5, "r_x1": 172.8, "r_y1": 293.5, "r_x2": 172.8, "r_y2": 287.1, "r_x3": 160.7, "r_y3": 287.1, "coord_origin": "TOPLEFT" }, "text": "", "orig": "", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 55, "label": "text", "bbox": { "l": 168.2, "t": 293.9, "r": 177.9, "b": 300.3, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 56, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 168.2, "r_y0": 300.3, "r_x1": 177.9, "r_y1": 300.3, "r_x2": 177.9, "r_y2": 293.9, "r_x3": 168.2, "r_y3": 293.9, "coord_origin": "TOPLEFT" }, "text": "", "orig": ">", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 59, "label": "text", "bbox": { "l": 263.4, "t": 293.9, "r": 278.9, "b": 300.3, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 60, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 263.4, "r_y0": 300.3, "r_x1": 278.9, "r_y1": 300.3, "r_x2": 278.9, "r_y2": 293.9, "r_x3": 263.4, "r_y3": 293.9, "coord_origin": "TOPLEFT" }, "text": "", "orig": "", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 60, "label": "text", "bbox": { "l": 280.8, "t": 293.9, "r": 290.5, "b": 300.3, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 61, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 280.8, "r_y0": 300.3, "r_x1": 290.5, "r_y1": 300.3, "r_x2": 290.5, "r_y2": 293.9, "r_x3": 280.8, "r_y3": 293.9, "coord_origin": "TOPLEFT" }, "text": "", "orig": ">", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 63, "label": "text", "bbox": { "l": 335.9, "t": 293.9, "r": 351.5, "b": 300.3, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 64, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 335.9, "r_y0": 300.3, "r_x1": 351.5, "r_y1": 300.3, "r_x2": 351.5, "r_y2": 293.9, "r_x3": 335.9, "r_y3": 293.9, "coord_origin": "TOPLEFT" }, "text": "", "orig": "", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 64, "label": "text", "bbox": { "l": 160.7, "t": 300.8, "r": 174.7, "b": 307.1, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 65, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 160.7, "r_y0": 307.1, "r_x1": 174.7, "r_y1": 307.1, "r_x2": 174.7, "r_y2": 300.8, "r_x3": 160.7, "r_y3": 300.8, "coord_origin": "TOPLEFT" }, "text": "", "orig": "", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 65, "label": "text", "bbox": { "l": 160.7, "t": 307.6, "r": 172.8, "b": 314.0, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 66, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 160.7, "r_y0": 314.0, "r_x1": 172.8, "r_y1": 314.0, "r_x2": 172.8, "r_y2": 307.6, "r_x3": 160.7, "r_y3": 307.6, "coord_origin": "TOPLEFT" }, "text": "", "orig": "", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 66, "label": "text", "bbox": { "l": 168.2, "t": 314.4, "r": 181.9, "b": 320.8, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 67, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 168.2, "r_y0": 320.8, "r_x1": 181.9, "r_y1": 320.8, "r_x2": 181.9, "r_y2": 314.4, "r_x3": 168.2, "r_y3": 314.4, "coord_origin": "TOPLEFT" }, "text": "", "orig": "", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 68, "label": "text", "bbox": { "l": 201.2, "t": 314.4, "r": 214.9, "b": 320.8, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 69, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 201.2, "r_y0": 320.8, "r_x1": 214.9, "r_y1": 320.8, "r_x2": 214.9, "r_y2": 314.4, "r_x3": 201.2, "r_y3": 314.4, "coord_origin": "TOPLEFT" }, "text": "", "orig": "", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 70, "label": "text", "bbox": { "l": 234.2, "t": 314.4, "r": 247.8, "b": 320.8, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 71, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 234.2, "r_y0": 320.8, "r_x1": 247.8, "r_y1": 320.8, "r_x2": 247.8, "r_y2": 314.4, "r_x3": 234.2, "r_y3": 314.4, "coord_origin": "TOPLEFT" }, "text": "", "orig": "", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 72, "label": "text", "bbox": { "l": 160.7, "t": 321.2, "r": 174.7, "b": 327.6, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 73, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 160.7, "r_y0": 327.6, "r_x1": 174.7, "r_y1": 327.6, "r_x2": 174.7, "r_y2": 321.2, "r_x3": 160.7, "r_y3": 321.2, "coord_origin": "TOPLEFT" }, "text": "", "orig": "", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 73, "label": "text", "bbox": { "l": 160.7, "t": 328.0, "r": 172.8, "b": 334.4, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 74, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 160.7, "r_y0": 334.4, "r_x1": 172.8, "r_y1": 334.4, "r_x2": 172.8, "r_y2": 328.0, "r_x3": 160.7, "r_y3": 328.0, "coord_origin": "TOPLEFT" }, "text": "", "orig": "", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 74, "label": "text", "bbox": { "l": 168.2, "t": 334.8, "r": 373.1, "b": 341.2, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 75, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 168.2, "r_y0": 341.2, "r_x1": 373.1, "r_y1": 341.2, "r_x2": 373.1, "r_y2": 334.8, "r_x3": 168.2, "r_y3": 334.8, "coord_origin": "TOPLEFT" }, "text": "", "orig": "", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 75, "label": "text", "bbox": { "l": 160.7, "t": 341.7, "r": 174.7, "b": 348.0, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 76, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 160.7, "r_y0": 348.0, "r_x1": 174.7, "r_y1": 348.0, "r_x2": 174.7, "r_y2": 341.7, "r_x3": 160.7, "r_y3": 341.7, "coord_origin": "TOPLEFT" }, "text": "", "orig": "", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 76, "label": "text", "bbox": { "l": 160.7, "t": 348.5, "r": 172.8, "b": 354.9, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 77, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 160.7, "r_y0": 354.9, "r_x1": 172.8, "r_y1": 354.9, "r_x2": 172.8, "r_y2": 348.5, "r_x3": 160.7, "r_y3": 348.5, "coord_origin": "TOPLEFT" }, "text": "", "orig": "", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 77, "label": "text", "bbox": { "l": 168.2, "t": 355.3, "r": 181.9, "b": 361.7, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 78, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 168.2, "r_y0": 361.7, "r_x1": 181.9, "r_y1": 361.7, "r_x2": 181.9, "r_y2": 355.3, "r_x3": 168.2, "r_y3": 355.3, "coord_origin": "TOPLEFT" }, "text": "", "orig": "", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 79, "label": "text", "bbox": { "l": 201.2, "t": 355.3, "r": 214.9, "b": 361.7, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 80, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 201.2, "r_y0": 361.7, "r_x1": 214.9, "r_y1": 361.7, "r_x2": 214.9, "r_y2": 355.3, "r_x3": 201.2, "r_y3": 355.3, "coord_origin": "TOPLEFT" }, "text": "", "orig": "", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 81, "label": "text", "bbox": { "l": 234.2, "t": 355.3, "r": 247.8, "b": 361.7, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 82, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 234.2, "r_y0": 361.7, "r_x1": 247.8, "r_y1": 361.7, "r_x2": 247.8, "r_y2": 355.3, "r_x3": 234.2, "r_y3": 355.3, "coord_origin": "TOPLEFT" }, "text": "", "orig": "", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 83, "label": "text", "bbox": { "l": 267.2, "t": 355.3, "r": 280.8, "b": 361.7, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 84, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 267.2, "r_y0": 361.7, "r_x1": 280.8, "r_y1": 361.7, "r_x2": 280.8, "r_y2": 355.3, "r_x3": 267.2, "r_y3": 355.3, "coord_origin": "TOPLEFT" }, "text": "", "orig": "", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 85, "label": "text", "bbox": { "l": 160.7, "t": 362.1, "r": 174.7, "b": 368.5, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 86, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 160.7, "r_y0": 368.5, "r_x1": 174.7, "r_y1": 368.5, "r_x2": 174.7, "r_y2": 362.1, "r_x3": 160.7, "r_y3": 362.1, "coord_origin": "TOPLEFT" }, "text": "", "orig": "", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 86, "label": "text", "bbox": { "l": 160.7, "t": 368.9, "r": 172.8, "b": 375.3, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 87, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 160.7, "r_y0": 375.3, "r_x1": 172.8, "r_y1": 375.3, "r_x2": 172.8, "r_y2": 368.9, "r_x3": 160.7, "r_y3": 368.9, "coord_origin": "TOPLEFT" }, "text": "", "orig": "", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 87, "label": "text", "bbox": { "l": 168.2, "t": 375.7, "r": 181.9, "b": 382.1, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 88, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 168.2, "r_y0": 382.1, "r_x1": 181.9, "r_y1": 382.1, "r_x2": 181.9, "r_y2": 375.7, "r_x3": 168.2, "r_y3": 375.7, "coord_origin": "TOPLEFT" }, "text": "", "orig": "", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 89, "label": "text", "bbox": { "l": 201.2, "t": 375.7, "r": 214.9, "b": 382.1, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 90, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 201.2, "r_y0": 382.1, "r_x1": 214.9, "r_y1": 382.1, "r_x2": 214.9, "r_y2": 375.7, "r_x3": 201.2, "r_y3": 375.7, "coord_origin": "TOPLEFT" }, "text": "", "orig": "", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 91, "label": "text", "bbox": { "l": 234.2, "t": 375.7, "r": 247.8, "b": 382.1, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 92, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 234.2, "r_y0": 382.1, "r_x1": 247.8, "r_y1": 382.1, "r_x2": 247.8, "r_y2": 375.7, "r_x3": 234.2, "r_y3": 375.7, "coord_origin": "TOPLEFT" }, "text": "", "orig": "", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 93, "label": "text", "bbox": { "l": 267.2, "t": 375.7, "r": 280.8, "b": 382.1, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 94, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 267.2, "r_y0": 382.1, "r_x1": 280.8, "r_y1": 382.1, "r_x2": 280.8, "r_y2": 375.7, "r_x3": 267.2, "r_y3": 375.7, "coord_origin": "TOPLEFT" }, "text": "", "orig": "", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 95, "label": "text", "bbox": { "l": 160.7, "t": 382.6, "r": 174.7, "b": 388.9, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 96, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 160.7, "r_y0": 388.9, "r_x1": 174.7, "r_y1": 388.9, "r_x2": 174.7, "r_y2": 382.6, "r_x3": 160.7, "r_y3": 382.6, "coord_origin": "TOPLEFT" }, "text": "", "orig": "", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 96, "label": "text", "bbox": { "l": 153.1, "t": 389.4, "r": 177.7, "b": 395.8, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 97, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 153.1, "r_y0": 395.8, "r_x1": 177.7, "r_y1": 395.8, "r_x2": 177.7, "r_y2": 389.4, "r_x3": 153.1, "r_y3": 389.4, "coord_origin": "TOPLEFT" }, "text": "
", "orig": "", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 67, "label": "text", "bbox": { "l": 183.8, "t": 314.4, "r": 199.3, "b": 320.8, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 68, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 183.8, "r_y0": 320.8, "r_x1": 199.3, "r_y1": 320.8, "r_x2": 199.3, "r_y2": 314.4, "r_x3": 183.8, "r_y3": 314.4, "coord_origin": "TOPLEFT" }, "text": "", "orig": "", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 69, "label": "text", "bbox": { "l": 216.8, "t": 314.4, "r": 232.3, "b": 320.8, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 70, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 216.8, "r_y0": 320.8, "r_x1": 232.3, "r_y1": 320.8, "r_x2": 232.3, "r_y2": 314.4, "r_x3": 216.8, "r_y3": 314.4, "coord_origin": "TOPLEFT" }, "text": "", "orig": "", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 71, "label": "text", "bbox": { "l": 249.7, "t": 314.4, "r": 265.3, "b": 320.8, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 72, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 249.7, "r_y0": 320.8, "r_x1": 265.3, "r_y1": 320.8, "r_x2": 265.3, "r_y2": 314.4, "r_x3": 249.7, "r_y3": 314.4, "coord_origin": "TOPLEFT" }, "text": "
", "orig": "", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 78, "label": "text", "bbox": { "l": 183.8, "t": 355.3, "r": 199.3, "b": 361.7, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 79, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 183.8, "r_y0": 361.7, "r_x1": 199.3, "r_y1": 361.7, "r_x2": 199.3, "r_y2": 355.3, "r_x3": 183.8, "r_y3": 355.3, "coord_origin": "TOPLEFT" }, "text": "", "orig": "", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 80, "label": "text", "bbox": { "l": 216.8, "t": 355.3, "r": 232.3, "b": 361.7, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 81, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 216.8, "r_y0": 361.7, "r_x1": 232.3, "r_y1": 361.7, "r_x2": 232.3, "r_y2": 355.3, "r_x3": 216.8, "r_y3": 355.3, "coord_origin": "TOPLEFT" }, "text": "", "orig": "", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 82, "label": "text", "bbox": { "l": 249.7, "t": 355.3, "r": 265.3, "b": 361.7, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 83, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 249.7, "r_y0": 361.7, "r_x1": 265.3, "r_y1": 361.7, "r_x2": 265.3, "r_y2": 355.3, "r_x3": 249.7, "r_y3": 355.3, "coord_origin": "TOPLEFT" }, "text": "", "orig": "", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 84, "label": "text", "bbox": { "l": 282.7, "t": 355.3, "r": 298.2, "b": 361.7, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 85, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 282.7, "r_y0": 361.7, "r_x1": 298.2, "r_y1": 361.7, "r_x2": 298.2, "r_y2": 355.3, "r_x3": 282.7, "r_y3": 355.3, "coord_origin": "TOPLEFT" }, "text": "
", "orig": "", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 88, "label": "text", "bbox": { "l": 183.8, "t": 375.7, "r": 199.3, "b": 382.1, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 89, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 183.8, "r_y0": 382.1, "r_x1": 199.3, "r_y1": 382.1, "r_x2": 199.3, "r_y2": 375.7, "r_x3": 183.8, "r_y3": 375.7, "coord_origin": "TOPLEFT" }, "text": "", "orig": "", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 90, "label": "text", "bbox": { "l": 216.8, "t": 375.7, "r": 232.3, "b": 382.1, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 91, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 216.8, "r_y0": 382.1, "r_x1": 232.3, "r_y1": 382.1, "r_x2": 232.3, "r_y2": 375.7, "r_x3": 216.8, "r_y3": 375.7, "coord_origin": "TOPLEFT" }, "text": "", "orig": "", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 92, "label": "text", "bbox": { "l": 249.7, "t": 375.7, "r": 265.3, "b": 382.1, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 93, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 249.7, "r_y0": 382.1, "r_x1": 265.3, "r_y1": 382.1, "r_x2": 265.3, "r_y2": 375.7, "r_x3": 249.7, "r_y3": 375.7, "coord_origin": "TOPLEFT" }, "text": "", "orig": "", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 94, "label": "text", "bbox": { "l": 282.7, "t": 375.7, "r": 298.2, "b": 382.1, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 95, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 282.7, "r_y0": 382.1, "r_x1": 298.2, "r_y1": 382.1, "r_x2": 298.2, "r_y2": 375.7, "r_x3": 282.7, "r_y3": 375.7, "coord_origin": "TOPLEFT" }, "text": "
", "orig": "", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 97, "label": "text", "bbox": { "l": 395.1, "t": 411.3, "r": 401.6, "b": 419.9, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 98, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 395.1, "r_y0": 419.9, "r_x1": 401.6, "r_y1": 419.9, "r_x2": 401.6, "r_y2": 411.3, "r_x3": 395.1, "r_y3": 411.3, "coord_origin": "TOPLEFT" }, "text": "C", "orig": "C", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 98, "label": "text", "bbox": { "l": 407.4, "t": 411.3, "r": 412.5, "b": 419.9, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 99, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 407.4, "r_y0": 419.9, "r_x1": 412.5, "r_y1": 419.9, "r_x2": 412.5, "r_y2": 411.3, "r_x3": 407.4, "r_y3": 411.3, "coord_origin": "TOPLEFT" }, "text": "L", "orig": "L", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 99, "label": "text", "bbox": { "l": 418.7, "t": 411.3, "r": 425.3, "b": 419.9, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 100, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 418.7, "r_y0": 419.9, "r_x1": 425.3, "r_y1": 419.9, "r_x2": 425.3, "r_y2": 411.3, "r_x3": 418.7, "r_y3": 411.3, "coord_origin": "TOPLEFT" }, "text": "U", "orig": "U", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 100, "label": "text", "bbox": { "l": 430.5, "t": 411.3, "r": 436.6, "b": 419.9, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 101, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 430.5, "r_y0": 419.9, "r_x1": 436.6, "r_y1": 419.9, "r_x2": 436.6, "r_y2": 411.3, "r_x3": 430.5, "r_y3": 411.3, "coord_origin": "TOPLEFT" }, "text": "X", "orig": "X", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 101, "label": "text", "bbox": { "l": 152.4, "t": 409.8, "r": 175.1, "b": 416.2, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 102, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 152.4, "r_y0": 416.2, "r_x1": 175.1, "r_y1": 416.2, "r_x2": 175.1, "r_y2": 409.8, "r_x3": 152.4, "r_y3": 409.8, "coord_origin": "TOPLEFT" }, "text": "", "orig": "
", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 102, "label": "text", "bbox": { "l": 178.9, "t": 409.8, "r": 191.0, "b": 416.2, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 103, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 178.9, "r_y0": 416.2, "r_x1": 191.0, "r_y1": 416.2, "r_x2": 191.0, "r_y2": 409.8, "r_x3": 178.9, "r_y3": 409.8, "coord_origin": "TOPLEFT" }, "text": "", "orig": "", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 103, "label": "text", "bbox": { "l": 194.8, "t": 409.8, "r": 208.8, "b": 416.2, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 104, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 194.8, "r_y0": 416.2, "r_x1": 208.8, "r_y1": 416.2, "r_x2": 208.8, "r_y2": 409.8, "r_x3": 194.8, "r_y3": 409.8, "coord_origin": "TOPLEFT" }, "text": "", "orig": "", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 104, "label": "text", "bbox": { "l": 212.6, "t": 409.8, "r": 226.3, "b": 416.2, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 105, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 212.6, "r_y0": 416.2, "r_x1": 226.3, "r_y1": 416.2, "r_x2": 226.3, "r_y2": 409.8, "r_x3": 212.6, "r_y3": 409.8, "coord_origin": "TOPLEFT" }, "text": "", "orig": "", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 106, "label": "text", "bbox": { "l": 249.4, "t": 409.8, "r": 259.0, "b": 416.2, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 107, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 249.4, "r_y0": 416.2, "r_x1": 259.0, "r_y1": 416.2, "r_x2": 259.0, "r_y2": 409.8, "r_x3": 249.4, "r_y3": 409.8, "coord_origin": "TOPLEFT" }, "text": "", "orig": ">", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 112, "label": "text", "bbox": { "l": 244.5, "t": 418.1, "r": 269.1, "b": 424.5, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 113, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 244.5, "r_y0": 424.5, "r_x1": 269.1, "r_y1": 424.5, "r_x2": 269.1, "r_y2": 418.1, "r_x3": 244.5, "r_y3": 418.1, "coord_origin": "TOPLEFT" }, "text": "
", "orig": "", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 105, "label": "text", "bbox": { "l": 230.0, "t": 409.8, "r": 245.6, "b": 416.2, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 106, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 230.0, "r_y0": 416.2, "r_x1": 245.6, "r_y1": 416.2, "r_x2": 245.6, "r_y2": 409.8, "r_x3": 230.0, "r_y3": 409.8, "coord_origin": "TOPLEFT" }, "text": "
", "orig": "", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 113, "label": "text", "bbox": { "l": 154.5, "t": 258.6, "r": 159.6, "b": 265.7, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 114, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 154.5, "r_y0": 265.7, "r_x1": 159.6, "r_y1": 265.7, "r_x2": 159.6, "r_y2": 258.6, "r_x3": 154.5, "r_y3": 258.6, "coord_origin": "TOPLEFT" }, "text": "C", "orig": "C", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 114, "label": "text", "bbox": { "l": 164.7, "t": 258.6, "r": 185.2, "b": 265.7, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 115, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 164.7, "r_y0": 265.7, "r_x1": 185.2, "r_y1": 265.7, "r_x2": 185.2, "r_y2": 258.6, "r_x3": 164.7, "r_y3": 258.6, "coord_origin": "TOPLEFT" }, "text": "HTML", "orig": "HTML", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 115, "label": "text", "bbox": { "l": 164.4, "t": 266.5, "r": 222.1, "b": 273.6, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 116, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 164.4, "r_y0": 273.6, "r_x1": 222.1, "r_y1": 273.6, "r_x2": 222.1, "r_y2": 266.5, "r_x3": 164.4, "r_y3": 266.5, "coord_origin": "TOPLEFT" }, "text": "sequence length:", "orig": "sequence length:", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 116, "label": "text", "bbox": { "l": 224.2, "t": 266.5, "r": 232.6, "b": 273.6, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 117, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 224.2, "r_y0": 273.6, "r_x1": 232.6, "r_y1": 273.6, "r_x2": 232.6, "r_y2": 266.5, "r_x3": 224.2, "r_y3": 266.5, "coord_origin": "TOPLEFT" }, "text": "55", "orig": "55", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] } ] }, "text": "", "annotations": [], "provenance": null, "predicted_class": null, "confidence": null }, { "label": "text", "id": 2, "page_no": 1, "cluster": { "id": 2, "label": "text", "bbox": { "l": 134.8, "t": 452.3, "r": 480.6, "b": 520.9, "coord_origin": "TOPLEFT" }, "confidence": 0.95, "cells": [ { "index": 118, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 134.8, "r_y0": 461.1, "r_x1": 161.3, "r_y1": 461.1, "r_x2": 161.3, "r_y2": 452.3, "r_x3": 134.8, "r_y3": 452.3, "coord_origin": "TOPLEFT" }, "text": "today,", "orig": "today,", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 119, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 164.3, "r_y0": 461.1, "r_x1": 226.3, "r_y1": 461.1, "r_x2": 226.3, "r_y2": 452.3, "r_x3": 164.3, "r_y3": 452.3, "coord_origin": "TOPLEFT" }, "text": "table detection", "orig": "table detection", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 120, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 230.0, "r_y0": 461.1, "r_x1": 480.6, "r_y1": 461.1, "r_x2": 480.6, "r_y2": 452.3, "r_x3": 230.0, "r_y3": 452.3, "coord_origin": "TOPLEFT" }, "text": "in documents is a well understood problem, and the latest", "orig": "in documents is a well understood problem, and the latest", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 121, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 134.8, "r_y0": 473.1, "r_x1": 480.6, "r_y1": 473.1, "r_x2": 480.6, "r_y2": 464.3, "r_x3": 134.8, "r_y3": 464.3, "coord_origin": "TOPLEFT" }, "text": "state-of-the-art (SOTA) object detection methods provide an accuracy compa-", "orig": "state-of-the-art (SOTA) object detection methods provide an accuracy compa-", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 122, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 134.8, "r_y0": 485.0, "r_x1": 480.6, "r_y1": 485.0, "r_x2": 480.6, "r_y2": 476.2, "r_x3": 134.8, "r_y3": 476.2, "coord_origin": "TOPLEFT" }, "text": "rable to human observers [7,8,10,14,23]. On the other hand, the problem of table", "orig": "rable to human observers [7,8,10,14,23]. On the other hand, the problem of table", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 123, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 134.8, "r_y0": 497.0, "r_x1": 480.6, "r_y1": 497.0, "r_x2": 480.6, "r_y2": 488.2, "r_x3": 134.8, "r_y3": 488.2, "coord_origin": "TOPLEFT" }, "text": "structure recognition (TSR) is a lot more challenging and remains a very active", "orig": "structure recognition (TSR) is a lot more challenging and remains a very active", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 124, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 134.8, "r_y0": 508.9, "r_x1": 480.6, "r_y1": 508.9, "r_x2": 480.6, "r_y2": 500.1, "r_x3": 134.8, "r_y3": 500.1, "coord_origin": "TOPLEFT" }, "text": "area of research, in which many novel machine learning algorithms are being", "orig": "area of research, in which many novel machine learning algorithms are being", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 125, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 134.8, "r_y0": 520.9, "r_x1": 313.2, "r_y1": 520.9, "r_x2": 313.2, "r_y2": 512.1, "r_x3": 134.8, "r_y3": 512.1, "coord_origin": "TOPLEFT" }, "text": "explored [3,4,5,9,11,12,13,14,17,18,21,22].", "orig": "explored [3,4,5,9,11,12,13,14,17,18,21,22].", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, "text": "today, table detection in documents is a well understood problem, and the latest state-of-the-art (SOTA) object detection methods provide an accuracy comparable to human observers [7,8,10,14,23]. On the other hand, the problem of table structure recognition (TSR) is a lot more challenging and remains a very active area of research, in which many novel machine learning algorithms are being explored [3,4,5,9,11,12,13,14,17,18,21,22]." }, { "label": "text", "id": 0, "page_no": 1, "cluster": { "id": 0, "label": "text", "bbox": { "l": 134.8, "t": 524.6, "r": 480.6, "b": 664.9, "coord_origin": "TOPLEFT" }, "confidence": 0.98, "cells": [ { "index": 126, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 149.7, "r_y0": 533.3, "r_x1": 480.6, "r_y1": 533.3, "r_x2": 480.6, "r_y2": 524.6, "r_x3": 149.7, "r_y3": 524.6, "coord_origin": "TOPLEFT" }, "text": "Recently emerging SOTA methods for table structure recognition employ", "orig": "Recently emerging SOTA methods for table structure recognition employ", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 127, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 134.8, "r_y0": 545.3, "r_x1": 480.6, "r_y1": 545.3, "r_x2": 480.6, "r_y2": 536.5, "r_x3": 134.8, "r_y3": 536.5, "coord_origin": "TOPLEFT" }, "text": "transformer-based models, in which an image of the table is provided to the net-", "orig": "transformer-based models, in which an image of the table is provided to the net-", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 128, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 134.8, "r_y0": 557.3, "r_x1": 480.6, "r_y1": 557.3, "r_x2": 480.6, "r_y2": 548.5, "r_x3": 134.8, "r_y3": 548.5, "coord_origin": "TOPLEFT" }, "text": "work in order to predict the structure of the table as a sequence of tokens. These", "orig": "work in order to predict the structure of the table as a sequence of tokens. These", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 129, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 134.8, "r_y0": 569.2, "r_x1": 480.6, "r_y1": 569.2, "r_x2": 480.6, "r_y2": 560.4, "r_x3": 134.8, "r_y3": 560.4, "coord_origin": "TOPLEFT" }, "text": "image-to-sequence (Im2Seq) models are extremely powerful, since they allow for", "orig": "image-to-sequence (Im2Seq) models are extremely powerful, since they allow for", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 130, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 134.8, "r_y0": 581.2, "r_x1": 480.6, "r_y1": 581.2, "r_x2": 480.6, "r_y2": 572.4, "r_x3": 134.8, "r_y3": 572.4, "coord_origin": "TOPLEFT" }, "text": "a purely data-driven solution. The tokens of the sequence typically belong to a", "orig": "a purely data-driven solution. The tokens of the sequence typically belong to a", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 131, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 134.8, "r_y0": 593.1, "r_x1": 480.6, "r_y1": 593.1, "r_x2": 480.6, "r_y2": 584.3, "r_x3": 134.8, "r_y3": 584.3, "coord_origin": "TOPLEFT" }, "text": "markup language such as HTML, Latex or Markdown, which allow to describe", "orig": "markup language such as HTML, Latex or Markdown, which allow to describe", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 132, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 134.8, "r_y0": 605.1, "r_x1": 480.6, "r_y1": 605.1, "r_x2": 480.6, "r_y2": 596.3, "r_x3": 134.8, "r_y3": 596.3, "coord_origin": "TOPLEFT" }, "text": "table structure as rows, columns and spanning cells in various configurations.", "orig": "table structure as rows, columns and spanning cells in various configurations.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 133, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 134.8, "r_y0": 617.0, "r_x1": 480.6, "r_y1": 617.0, "r_x2": 480.6, "r_y2": 608.2, "r_x3": 134.8, "r_y3": 608.2, "coord_origin": "TOPLEFT" }, "text": "In Figure 1, we illustrate how HTML is used to represent the table-structure", "orig": "In Figure 1, we illustrate how HTML is used to represent the table-structure", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 134, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 134.8, "r_y0": 629.0, "r_x1": 480.6, "r_y1": 629.0, "r_x2": 480.6, "r_y2": 620.2, "r_x3": 134.8, "r_y3": 620.2, "coord_origin": "TOPLEFT" }, "text": "of a particular example table. Public table-structure data sets such as PubTab-", "orig": "of a particular example table. Public table-structure data sets such as PubTab-", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 135, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 134.8, "r_y0": 640.9, "r_x1": 480.6, "r_y1": 640.9, "r_x2": 480.6, "r_y2": 632.1, "r_x3": 134.8, "r_y3": 632.1, "coord_origin": "TOPLEFT" }, "text": "Net [22], and FinTabNet [21], which were created in a semi-automated way from", "orig": "Net [22], and FinTabNet [21], which were created in a semi-automated way from", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 136, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 134.8, "r_y0": 652.9, "r_x1": 480.6, "r_y1": 652.9, "r_x2": 480.6, "r_y2": 644.1, "r_x3": 134.8, "r_y3": 644.1, "coord_origin": "TOPLEFT" }, "text": "paired PDF and HTML sources (e.g. PubMed Central), popularized primarily", "orig": "paired PDF and HTML sources (e.g. PubMed Central), popularized primarily", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 137, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 134.8, "r_y0": 664.9, "r_x1": 421.5, "r_y1": 664.9, "r_x2": 421.5, "r_y2": 656.1, "r_x3": 134.8, "r_y3": 656.1, "coord_origin": "TOPLEFT" }, "text": "the use of HTML as ground-truth representation format for TSR.", "orig": "the use of HTML as ground-truth representation format for TSR.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, "text": "Recently emerging SOTA methods for table structure recognition employ transformer-based models, in which an image of the table is provided to the network in order to predict the structure of the table as a sequence of tokens. These image-to-sequence (Im2Seq) models are extremely powerful, since they allow for a purely data-driven solution. The tokens of the sequence typically belong to a markup language such as HTML, Latex or Markdown, which allow to describe table structure as rows, columns and spanning cells in various configurations. In Figure 1, we illustrate how HTML is used to represent the table-structure of a particular example table. Public table-structure data sets such as PubTabNet [22], and FinTabNet [21], which were created in a semi-automated way from paired PDF and HTML sources (e.g. PubMed Central), popularized primarily the use of HTML as ground-truth representation format for TSR." } ], "headers": [ { "label": "page_header", "id": 5, "page_no": 1, "cluster": { "id": 5, "label": "page_header", "bbox": { "l": 134.8, "t": 93.8, "r": 139.4, "b": 101.8, "coord_origin": "TOPLEFT" }, "confidence": 0.86, "cells": [ { "index": 0, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 134.8, "r_y0": 101.8, "r_x1": 139.4, "r_y1": 101.8, "r_x2": 139.4, "r_y2": 93.8, "r_x3": 134.8, "r_y3": 93.8, "coord_origin": "TOPLEFT" }, "text": "2", "orig": "2", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, "text": "2" }, { "label": "page_header", "id": 3, "page_no": 1, "cluster": { "id": 3, "label": "page_header", "bbox": { "l": 167.8, "t": 93.8, "r": 231.7, "b": 101.8, "coord_origin": "TOPLEFT" }, "confidence": 0.91, "cells": [ { "index": 1, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 167.8, "r_y0": 101.8, "r_x1": 178.1, "r_y1": 101.8, "r_x2": 178.1, "r_y2": 93.8, "r_x3": 167.8, "r_y3": 93.8, "coord_origin": "TOPLEFT" }, "text": "M.", "orig": "M.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 2, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 182.4, "r_y0": 101.8, "r_x1": 231.7, "r_y1": 101.8, "r_x2": 231.7, "r_y2": 93.8, "r_x3": 182.4, "r_y3": 93.8, "coord_origin": "TOPLEFT" }, "text": "Lysak, et al.", "orig": "Lysak, et al.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, "text": "M. Lysak, et al." } ] } }, { "page_no": 2, "size": { "width": 612.0, "height": 792.0 }, "parsed_page": { "dimension": { "angle": 0.0, "rect": { "r_x0": 0.0, "r_y0": 0.0, "r_x1": 612.0, "r_y1": 0.0, "r_x2": 612.0, "r_y2": 792.0, "r_x3": 0.0, "r_y3": 792.0, "coord_origin": "BOTTOMLEFT" }, "boundary_type": "crop_box", "art_bbox": { "l": 0.0, "t": 792.0, "r": 612.0, "b": 0.0, "coord_origin": "BOTTOMLEFT" }, "bleed_bbox": { "l": 0.0, "t": 792.0, "r": 612.0, "b": 0.0, "coord_origin": "BOTTOMLEFT" }, "crop_bbox": { "l": 0.0, "t": 792.0, "r": 612.0, "b": 0.0, "coord_origin": "BOTTOMLEFT" }, "media_bbox": { "l": 0.0, "t": 792.0, "r": 612.0, "b": 0.0, "coord_origin": "BOTTOMLEFT" }, "trim_bbox": { "l": 0.0, "t": 792.0, "r": 612.0, "b": 0.0, "coord_origin": "BOTTOMLEFT" } }, "bitmap_resources": [], "char_cells": [], "word_cells": [], "textline_cells": [ { "index": 0, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 194.5, "r_y0": 101.8, "r_x1": 447.5, "r_y1": 101.8, "r_x2": 447.5, "r_y2": 93.8, "r_x3": 194.5, "r_y3": 93.8, "coord_origin": "TOPLEFT" }, "text": "Optimized Table Tokenization for Table Structure Recognition", "orig": "Optimized Table Tokenization for Table Structure Recognition", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 1, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 476.0, "r_y0": 101.8, "r_x1": 480.6, "r_y1": 101.8, "r_x2": 480.6, "r_y2": 93.8, "r_x3": 476.0, "r_y3": 93.8, "coord_origin": "TOPLEFT" }, "text": "3", "orig": "3", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 2, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 149.7, "r_y0": 127.7, "r_x1": 480.6, "r_y1": 127.7, "r_x2": 480.6, "r_y2": 118.9, "r_x3": 149.7, "r_y3": 118.9, "coord_origin": "TOPLEFT" }, "text": "While the majority of research in TSR is currently focused on the develop-", "orig": "While the majority of research in TSR is currently focused on the develop-", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 3, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 134.8, "r_y0": 139.7, "r_x1": 480.6, "r_y1": 139.7, "r_x2": 480.6, "r_y2": 130.9, "r_x3": 134.8, "r_y3": 130.9, "coord_origin": "TOPLEFT" }, "text": "ment and application of novel neural model architectures, the table structure", "orig": "ment and application of novel neural model architectures, the table structure", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 4, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 134.8, "r_y0": 151.6, "r_x1": 480.6, "r_y1": 151.6, "r_x2": 480.6, "r_y2": 142.8, "r_x3": 134.8, "r_y3": 142.8, "coord_origin": "TOPLEFT" }, "text": "representation language (e.g. HTML in PubTabNet and FinTabNet) is usually", "orig": "representation language (e.g. HTML in PubTabNet and FinTabNet) is usually", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 5, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 134.8, "r_y0": 163.6, "r_x1": 169.6, "r_y1": 163.6, "r_x2": 169.6, "r_y2": 154.8, "r_x3": 134.8, "r_y3": 154.8, "coord_origin": "TOPLEFT" }, "text": "adopted", "orig": "adopted", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 6, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 173.9, "r_y0": 163.6, "r_x1": 194.6, "r_y1": 163.6, "r_x2": 194.6, "r_y2": 154.8, "r_x3": 173.9, "r_y3": 154.8, "coord_origin": "TOPLEFT" }, "text": "as is", "orig": "as is", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 7, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 199.6, "r_y0": 163.6, "r_x1": 480.6, "r_y1": 163.6, "r_x2": 480.6, "r_y2": 154.8, "r_x3": 199.6, "r_y3": 154.8, "coord_origin": "TOPLEFT" }, "text": "for the sequence tokenization in Im2Seq models. In this paper,", "orig": "for the sequence tokenization in Im2Seq models. In this paper,", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 8, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 134.8, "r_y0": 175.6, "r_x1": 480.6, "r_y1": 175.6, "r_x2": 480.6, "r_y2": 166.8, "r_x3": 134.8, "r_y3": 166.8, "coord_origin": "TOPLEFT" }, "text": "we aim for the opposite and investigate the impact of the table structure rep-", "orig": "we aim for the opposite and investigate the impact of the table structure rep-", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 9, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 134.8, "r_y0": 187.5, "r_x1": 480.6, "r_y1": 187.5, "r_x2": 480.6, "r_y2": 178.7, "r_x3": 134.8, "r_y3": 178.7, "coord_origin": "TOPLEFT" }, "text": "resentation language with an otherwise unmodified Im2Seq transformer-based", "orig": "resentation language with an otherwise unmodified Im2Seq transformer-based", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 10, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 134.8, "r_y0": 199.5, "r_x1": 480.6, "r_y1": 199.5, "r_x2": 480.6, "r_y2": 190.7, "r_x3": 134.8, "r_y3": 190.7, "coord_origin": "TOPLEFT" }, "text": "architecture. Since the current state-of-the-art Im2Seq model is TableFormer [9],", "orig": "architecture. Since the current state-of-the-art Im2Seq model is TableFormer [9],", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 11, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 134.8, "r_y0": 211.4, "r_x1": 348.4, "r_y1": 211.4, "r_x2": 348.4, "r_y2": 202.6, "r_x3": 134.8, "r_y3": 202.6, "coord_origin": "TOPLEFT" }, "text": "we select this model to perform our experiments.", "orig": "we select this model to perform our experiments.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 12, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 149.7, "r_y0": 223.6, "r_x1": 480.6, "r_y1": 223.6, "r_x2": 480.6, "r_y2": 214.8, "r_x3": 149.7, "r_y3": 214.8, "coord_origin": "TOPLEFT" }, "text": "The main contribution of this paper is the introduction of a new optimised ta-", "orig": "The main contribution of this paper is the introduction of a new optimised ta-", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 13, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 134.8, "r_y0": 235.6, "r_x1": 480.6, "r_y1": 235.6, "r_x2": 480.6, "r_y2": 226.8, "r_x3": 134.8, "r_y3": 226.8, "coord_origin": "TOPLEFT" }, "text": "ble structure language (OTSL), specifically designed to describe table-structure", "orig": "ble structure language (OTSL), specifically designed to describe table-structure", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 14, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 134.8, "r_y0": 247.5, "r_x1": 480.6, "r_y1": 247.5, "r_x2": 480.6, "r_y2": 238.7, "r_x3": 134.8, "r_y3": 238.7, "coord_origin": "TOPLEFT" }, "text": "in an compact and structured way for Im2Seq models. OTSL has a number of", "orig": "in an compact and structured way for Im2Seq models. OTSL has a number of", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 15, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 134.8, "r_y0": 259.5, "r_x1": 480.6, "r_y1": 259.5, "r_x2": 480.6, "r_y2": 250.7, "r_x3": 134.8, "r_y3": 250.7, "coord_origin": "TOPLEFT" }, "text": "key features, which make it very attractive to use in Im2Seq models. Specifically,", "orig": "key features, which make it very attractive to use in Im2Seq models. Specifically,", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 16, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 134.8, "r_y0": 271.5, "r_x1": 480.6, "r_y1": 271.5, "r_x2": 480.6, "r_y2": 262.7, "r_x3": 134.8, "r_y3": 262.7, "coord_origin": "TOPLEFT" }, "text": "compared to other languages such as HTML, OTSL has a minimized vocabulary", "orig": "compared to other languages such as HTML, OTSL has a minimized vocabulary", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 17, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 134.8, "r_y0": 283.4, "r_x1": 480.6, "r_y1": 283.4, "r_x2": 480.6, "r_y2": 274.6, "r_x3": 134.8, "r_y3": 274.6, "coord_origin": "TOPLEFT" }, "text": "which yields short sequence length, strong inherent structure (e.g. strict rectan-", "orig": "which yields short sequence length, strong inherent structure (e.g. strict rectan-", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 18, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 134.8, "r_y0": 295.4, "r_x1": 480.6, "r_y1": 295.4, "r_x2": 480.6, "r_y2": 286.6, "r_x3": 134.8, "r_y3": 286.6, "coord_origin": "TOPLEFT" }, "text": "gular layout) and a strict syntax with rules that only look backwards. The latter", "orig": "gular layout) and a strict syntax with rules that only look backwards. The latter", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 19, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 134.8, "r_y0": 307.3, "r_x1": 480.6, "r_y1": 307.3, "r_x2": 480.6, "r_y2": 298.5, "r_x3": 134.8, "r_y3": 298.5, "coord_origin": "TOPLEFT" }, "text": "allows for syntax validation during inference and ensures a syntactically correct", "orig": "allows for syntax validation during inference and ensures a syntactically correct", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 20, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 134.8, "r_y0": 319.3, "r_x1": 480.6, "r_y1": 319.3, "r_x2": 480.6, "r_y2": 310.5, "r_x3": 134.8, "r_y3": 310.5, "coord_origin": "TOPLEFT" }, "text": "table-structure. These OTSL features are illustrated in Figure 1, in comparison", "orig": "table-structure. These OTSL features are illustrated in Figure 1, in comparison", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 21, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 134.8, "r_y0": 331.2, "r_x1": 179.7, "r_y1": 331.2, "r_x2": 179.7, "r_y2": 322.4, "r_x3": 134.8, "r_y3": 322.4, "coord_origin": "TOPLEFT" }, "text": "to HTML.", "orig": "to HTML.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 22, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 149.7, "r_y0": 343.4, "r_x1": 480.6, "r_y1": 343.4, "r_x2": 480.6, "r_y2": 334.6, "r_x3": 149.7, "r_y3": 334.6, "coord_origin": "TOPLEFT" }, "text": "The paper is structured as follows. In section 2, we give an overview of the", "orig": "The paper is structured as follows. In section 2, we give an overview of the", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 23, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 134.8, "r_y0": 355.4, "r_x1": 480.6, "r_y1": 355.4, "r_x2": 480.6, "r_y2": 346.6, "r_x3": 134.8, "r_y3": 346.6, "coord_origin": "TOPLEFT" }, "text": "latest developments in table-structure reconstruction. In section 3 we review", "orig": "latest developments in table-structure reconstruction. In section 3 we review", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 24, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 134.8, "r_y0": 367.4, "r_x1": 480.6, "r_y1": 367.4, "r_x2": 480.6, "r_y2": 358.6, "r_x3": 134.8, "r_y3": 358.6, "coord_origin": "TOPLEFT" }, "text": "the current HTML table encoding (popularised by PubTabNet and FinTabNet)", "orig": "the current HTML table encoding (popularised by PubTabNet and FinTabNet)", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 25, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 134.8, "r_y0": 379.3, "r_x1": 480.6, "r_y1": 379.3, "r_x2": 480.6, "r_y2": 370.5, "r_x3": 134.8, "r_y3": 370.5, "coord_origin": "TOPLEFT" }, "text": "and discuss its flaws. Subsequently, we introduce OTSL in section 4, which in-", "orig": "and discuss its flaws. Subsequently, we introduce OTSL in section 4, which in-", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 26, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 134.8, "r_y0": 391.3, "r_x1": 480.6, "r_y1": 391.3, "r_x2": 480.6, "r_y2": 382.5, "r_x3": 134.8, "r_y3": 382.5, "coord_origin": "TOPLEFT" }, "text": "cludes the language definition, syntax rules and error-correction procedures. In", "orig": "cludes the language definition, syntax rules and error-correction procedures. In", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 27, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 134.8, "r_y0": 403.2, "r_x1": 480.6, "r_y1": 403.2, "r_x2": 480.6, "r_y2": 394.4, "r_x3": 134.8, "r_y3": 394.4, "coord_origin": "TOPLEFT" }, "text": "section 5, we apply OTSL on the TableFormer architecture, compare it to Table-", "orig": "section 5, we apply OTSL on the TableFormer architecture, compare it to Table-", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 28, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 134.8, "r_y0": 415.2, "r_x1": 480.6, "r_y1": 415.2, "r_x2": 480.6, "r_y2": 406.4, "r_x3": 134.8, "r_y3": 406.4, "coord_origin": "TOPLEFT" }, "text": "Former models trained on HTML and ultimately demonstrate the advantages", "orig": "Former models trained on HTML and ultimately demonstrate the advantages", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 29, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 134.8, "r_y0": 427.1, "r_x1": 480.6, "r_y1": 427.1, "r_x2": 480.6, "r_y2": 418.3, "r_x3": 134.8, "r_y3": 418.3, "coord_origin": "TOPLEFT" }, "text": "of using OTSL. Finally, in section 6 we conclude our work and outline next", "orig": "of using OTSL. Finally, in section 6 we conclude our work and outline next", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 30, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 134.8, "r_y0": 439.1, "r_x1": 201.3, "r_y1": 439.1, "r_x2": 201.3, "r_y2": 430.3, "r_x3": 134.8, "r_y3": 430.3, "coord_origin": "TOPLEFT" }, "text": "potential steps.", "orig": "potential steps.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 31, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 134.8, "r_y0": 472.7, "r_x1": 141.5, "r_y1": 472.7, "r_x2": 141.5, "r_y2": 462.1, "r_x3": 134.8, "r_y3": 462.1, "coord_origin": "TOPLEFT" }, "text": "2", "orig": "2", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 32, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 154.9, "r_y0": 472.7, "r_x1": 236.8, "r_y1": 472.7, "r_x2": 236.8, "r_y2": 462.1, "r_x3": 154.9, "r_y3": 462.1, "coord_origin": "TOPLEFT" }, "text": "Related Work", "orig": "Related Work", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 33, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 134.8, "r_y0": 497.5, "r_x1": 480.6, "r_y1": 497.5, "r_x2": 480.6, "r_y2": 488.7, "r_x3": 134.8, "r_y3": 488.7, "coord_origin": "TOPLEFT" }, "text": "Approaches to formalize the logical structure and layout of tables in electronic", "orig": "Approaches to formalize the logical structure and layout of tables in electronic", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 34, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 134.8, "r_y0": 509.4, "r_x1": 480.6, "r_y1": 509.4, "r_x2": 480.6, "r_y2": 500.6, "r_x3": 134.8, "r_y3": 500.6, "coord_origin": "TOPLEFT" }, "text": "documents date back more than two decades [16]. In the recent past, a wide", "orig": "documents date back more than two decades [16]. In the recent past, a wide", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 35, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 134.8, "r_y0": 521.4, "r_x1": 480.6, "r_y1": 521.4, "r_x2": 480.6, "r_y2": 512.6, "r_x3": 134.8, "r_y3": 512.6, "coord_origin": "TOPLEFT" }, "text": "variety of computer vision methods have been explored to tackle the prob-", "orig": "variety of computer vision methods have been explored to tackle the prob-", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 36, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 134.8, "r_y0": 533.3, "r_x1": 480.6, "r_y1": 533.3, "r_x2": 480.6, "r_y2": 524.6, "r_x3": 134.8, "r_y3": 524.6, "coord_origin": "TOPLEFT" }, "text": "lem of table structure recognition, i.e. the correct identification of columns,", "orig": "lem of table structure recognition, i.e. the correct identification of columns,", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 37, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 134.8, "r_y0": 545.3, "r_x1": 480.6, "r_y1": 545.3, "r_x2": 480.6, "r_y2": 536.5, "r_x3": 134.8, "r_y3": 536.5, "coord_origin": "TOPLEFT" }, "text": "rows and spanning cells in a given table. Broadly speaking, the current deep-", "orig": "rows and spanning cells in a given table. Broadly speaking, the current deep-", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 38, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 134.8, "r_y0": 557.3, "r_x1": 480.6, "r_y1": 557.3, "r_x2": 480.6, "r_y2": 548.5, "r_x3": 134.8, "r_y3": 548.5, "coord_origin": "TOPLEFT" }, "text": "learning based approaches fall into three categories: object detection (OD) meth-", "orig": "learning based approaches fall into three categories: object detection (OD) meth-", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 39, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 134.8, "r_y0": 569.2, "r_x1": 480.6, "r_y1": 569.2, "r_x2": 480.6, "r_y2": 560.4, "r_x3": 134.8, "r_y3": 560.4, "coord_origin": "TOPLEFT" }, "text": "ods, Graph-Neural-Network (GNN) methods and Image-to-Markup-Sequence", "orig": "ods, Graph-Neural-Network (GNN) methods and Image-to-Markup-Sequence", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 40, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 134.8, "r_y0": 581.2, "r_x1": 484.1, "r_y1": 581.2, "r_x2": 484.1, "r_y2": 572.4, "r_x3": 134.8, "r_y3": 572.4, "coord_origin": "TOPLEFT" }, "text": "(Im2Seq) methods. Object-detection based methods [11,12,13,14,21] rely on table-", "orig": "(Im2Seq) methods. Object-detection based methods [11,12,13,14,21] rely on table-", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 41, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 134.8, "r_y0": 593.1, "r_x1": 480.6, "r_y1": 593.1, "r_x2": 480.6, "r_y2": 584.3, "r_x3": 134.8, "r_y3": 584.3, "coord_origin": "TOPLEFT" }, "text": "structure annotation using (overlapping) bounding boxes for training, and pro-", "orig": "structure annotation using (overlapping) bounding boxes for training, and pro-", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 42, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 134.8, "r_y0": 605.1, "r_x1": 480.6, "r_y1": 605.1, "r_x2": 480.6, "r_y2": 596.3, "r_x3": 134.8, "r_y3": 596.3, "coord_origin": "TOPLEFT" }, "text": "duce bounding-box predictions to define table cells, rows, and columns on a table", "orig": "duce bounding-box predictions to define table cells, rows, and columns on a table", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 43, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 134.8, "r_y0": 617.0, "r_x1": 480.6, "r_y1": 617.0, "r_x2": 480.6, "r_y2": 608.2, "r_x3": 134.8, "r_y3": 608.2, "coord_origin": "TOPLEFT" }, "text": "image. Graph Neural Network (GNN) based methods [3,6,17,18], as the name", "orig": "image. Graph Neural Network (GNN) based methods [3,6,17,18], as the name", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 44, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 134.8, "r_y0": 629.0, "r_x1": 480.6, "r_y1": 629.0, "r_x2": 480.6, "r_y2": 620.2, "r_x3": 134.8, "r_y3": 620.2, "coord_origin": "TOPLEFT" }, "text": "suggests, represent tables as graph structures. The graph nodes represent the", "orig": "suggests, represent tables as graph structures. The graph nodes represent the", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 45, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 134.8, "r_y0": 640.9, "r_x1": 480.6, "r_y1": 640.9, "r_x2": 480.6, "r_y2": 632.1, "r_x3": 134.8, "r_y3": 632.1, "coord_origin": "TOPLEFT" }, "text": "content of each table cell, an embedding vector from the table image, or geomet-", "orig": "content of each table cell, an embedding vector from the table image, or geomet-", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 46, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 134.8, "r_y0": 652.9, "r_x1": 480.6, "r_y1": 652.9, "r_x2": 480.6, "r_y2": 644.1, "r_x3": 134.8, "r_y3": 644.1, "coord_origin": "TOPLEFT" }, "text": "ric coordinates of the table cell. The edges of the graph define the relationship", "orig": "ric coordinates of the table cell. The edges of the graph define the relationship", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 47, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 134.8, "r_y0": 664.9, "r_x1": 480.6, "r_y1": 664.9, "r_x2": 480.6, "r_y2": 656.1, "r_x3": 134.8, "r_y3": 656.1, "coord_origin": "TOPLEFT" }, "text": "between the nodes, e.g. if they belong to the same column, row, or table cell.", "orig": "between the nodes, e.g. if they belong to the same column, row, or table cell.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "has_chars": false, "has_words": false, "has_lines": true, "image": null, "lines": [] }, "predictions": { "layout": { "clusters": [ { "id": 5, "label": "page_header", "bbox": { "l": 194.5, "t": 93.8, "r": 447.5, "b": 101.8, "coord_origin": "TOPLEFT" }, "confidence": 0.93, "cells": [ { "index": 0, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 194.5, "r_y0": 101.8, "r_x1": 447.5, "r_y1": 101.8, "r_x2": 447.5, "r_y2": 93.8, "r_x3": 194.5, "r_y3": 93.8, "coord_origin": "TOPLEFT" }, "text": "Optimized Table Tokenization for Table Structure Recognition", "orig": "Optimized Table Tokenization for Table Structure Recognition", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 6, "label": "page_header", "bbox": { "l": 476.0, "t": 93.8, "r": 480.6, "b": 101.8, "coord_origin": "TOPLEFT" }, "confidence": 0.88, "cells": [ { "index": 1, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 476.0, "r_y0": 101.8, "r_x1": 480.6, "r_y1": 101.8, "r_x2": 480.6, "r_y2": 93.8, "r_x3": 476.0, "r_y3": 93.8, "coord_origin": "TOPLEFT" }, "text": "3", "orig": "3", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 2, "label": "text", "bbox": { "l": 134.8, "t": 118.9, "r": 480.6, "b": 211.4, "coord_origin": "TOPLEFT" }, "confidence": 0.99, "cells": [ { "index": 2, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 149.7, "r_y0": 127.7, "r_x1": 480.6, "r_y1": 127.7, "r_x2": 480.6, "r_y2": 118.9, "r_x3": 149.7, "r_y3": 118.9, "coord_origin": "TOPLEFT" }, "text": "While the majority of research in TSR is currently focused on the develop-", "orig": "While the majority of research in TSR is currently focused on the develop-", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 3, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 134.8, "r_y0": 139.7, "r_x1": 480.6, "r_y1": 139.7, "r_x2": 480.6, "r_y2": 130.9, "r_x3": 134.8, "r_y3": 130.9, "coord_origin": "TOPLEFT" }, "text": "ment and application of novel neural model architectures, the table structure", "orig": "ment and application of novel neural model architectures, the table structure", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 4, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 134.8, "r_y0": 151.6, "r_x1": 480.6, "r_y1": 151.6, "r_x2": 480.6, "r_y2": 142.8, "r_x3": 134.8, "r_y3": 142.8, "coord_origin": "TOPLEFT" }, "text": "representation language (e.g. HTML in PubTabNet and FinTabNet) is usually", "orig": "representation language (e.g. HTML in PubTabNet and FinTabNet) is usually", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 5, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 134.8, "r_y0": 163.6, "r_x1": 169.6, "r_y1": 163.6, "r_x2": 169.6, "r_y2": 154.8, "r_x3": 134.8, "r_y3": 154.8, "coord_origin": "TOPLEFT" }, "text": "adopted", "orig": "adopted", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 6, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 173.9, "r_y0": 163.6, "r_x1": 194.6, "r_y1": 163.6, "r_x2": 194.6, "r_y2": 154.8, "r_x3": 173.9, "r_y3": 154.8, "coord_origin": "TOPLEFT" }, "text": "as is", "orig": "as is", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 7, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 199.6, "r_y0": 163.6, "r_x1": 480.6, "r_y1": 163.6, "r_x2": 480.6, "r_y2": 154.8, "r_x3": 199.6, "r_y3": 154.8, "coord_origin": "TOPLEFT" }, "text": "for the sequence tokenization in Im2Seq models. In this paper,", "orig": "for the sequence tokenization in Im2Seq models. In this paper,", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 8, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 134.8, "r_y0": 175.6, "r_x1": 480.6, "r_y1": 175.6, "r_x2": 480.6, "r_y2": 166.8, "r_x3": 134.8, "r_y3": 166.8, "coord_origin": "TOPLEFT" }, "text": "we aim for the opposite and investigate the impact of the table structure rep-", "orig": "we aim for the opposite and investigate the impact of the table structure rep-", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 9, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 134.8, "r_y0": 187.5, "r_x1": 480.6, "r_y1": 187.5, "r_x2": 480.6, "r_y2": 178.7, "r_x3": 134.8, "r_y3": 178.7, "coord_origin": "TOPLEFT" }, "text": "resentation language with an otherwise unmodified Im2Seq transformer-based", "orig": "resentation language with an otherwise unmodified Im2Seq transformer-based", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 10, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 134.8, "r_y0": 199.5, "r_x1": 480.6, "r_y1": 199.5, "r_x2": 480.6, "r_y2": 190.7, "r_x3": 134.8, "r_y3": 190.7, "coord_origin": "TOPLEFT" }, "text": "architecture. Since the current state-of-the-art Im2Seq model is TableFormer [9],", "orig": "architecture. Since the current state-of-the-art Im2Seq model is TableFormer [9],", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 11, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 134.8, "r_y0": 211.4, "r_x1": 348.4, "r_y1": 211.4, "r_x2": 348.4, "r_y2": 202.6, "r_x3": 134.8, "r_y3": 202.6, "coord_origin": "TOPLEFT" }, "text": "we select this model to perform our experiments.", "orig": "we select this model to perform our experiments.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 1, "label": "text", "bbox": { "l": 134.8, "t": 214.8, "r": 480.6, "b": 331.2, "coord_origin": "TOPLEFT" }, "confidence": 0.99, "cells": [ { "index": 12, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 149.7, "r_y0": 223.6, "r_x1": 480.6, "r_y1": 223.6, "r_x2": 480.6, "r_y2": 214.8, "r_x3": 149.7, "r_y3": 214.8, "coord_origin": "TOPLEFT" }, "text": "The main contribution of this paper is the introduction of a new optimised ta-", "orig": "The main contribution of this paper is the introduction of a new optimised ta-", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 13, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 134.8, "r_y0": 235.6, "r_x1": 480.6, "r_y1": 235.6, "r_x2": 480.6, "r_y2": 226.8, "r_x3": 134.8, "r_y3": 226.8, "coord_origin": "TOPLEFT" }, "text": "ble structure language (OTSL), specifically designed to describe table-structure", "orig": "ble structure language (OTSL), specifically designed to describe table-structure", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 14, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 134.8, "r_y0": 247.5, "r_x1": 480.6, "r_y1": 247.5, "r_x2": 480.6, "r_y2": 238.7, "r_x3": 134.8, "r_y3": 238.7, "coord_origin": "TOPLEFT" }, "text": "in an compact and structured way for Im2Seq models. OTSL has a number of", "orig": "in an compact and structured way for Im2Seq models. OTSL has a number of", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 15, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 134.8, "r_y0": 259.5, "r_x1": 480.6, "r_y1": 259.5, "r_x2": 480.6, "r_y2": 250.7, "r_x3": 134.8, "r_y3": 250.7, "coord_origin": "TOPLEFT" }, "text": "key features, which make it very attractive to use in Im2Seq models. Specifically,", "orig": "key features, which make it very attractive to use in Im2Seq models. Specifically,", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 16, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 134.8, "r_y0": 271.5, "r_x1": 480.6, "r_y1": 271.5, "r_x2": 480.6, "r_y2": 262.7, "r_x3": 134.8, "r_y3": 262.7, "coord_origin": "TOPLEFT" }, "text": "compared to other languages such as HTML, OTSL has a minimized vocabulary", "orig": "compared to other languages such as HTML, OTSL has a minimized vocabulary", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 17, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 134.8, "r_y0": 283.4, "r_x1": 480.6, "r_y1": 283.4, "r_x2": 480.6, "r_y2": 274.6, "r_x3": 134.8, "r_y3": 274.6, "coord_origin": "TOPLEFT" }, "text": "which yields short sequence length, strong inherent structure (e.g. strict rectan-", "orig": "which yields short sequence length, strong inherent structure (e.g. strict rectan-", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 18, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 134.8, "r_y0": 295.4, "r_x1": 480.6, "r_y1": 295.4, "r_x2": 480.6, "r_y2": 286.6, "r_x3": 134.8, "r_y3": 286.6, "coord_origin": "TOPLEFT" }, "text": "gular layout) and a strict syntax with rules that only look backwards. The latter", "orig": "gular layout) and a strict syntax with rules that only look backwards. The latter", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 19, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 134.8, "r_y0": 307.3, "r_x1": 480.6, "r_y1": 307.3, "r_x2": 480.6, "r_y2": 298.5, "r_x3": 134.8, "r_y3": 298.5, "coord_origin": "TOPLEFT" }, "text": "allows for syntax validation during inference and ensures a syntactically correct", "orig": "allows for syntax validation during inference and ensures a syntactically correct", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 20, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 134.8, "r_y0": 319.3, "r_x1": 480.6, "r_y1": 319.3, "r_x2": 480.6, "r_y2": 310.5, "r_x3": 134.8, "r_y3": 310.5, "coord_origin": "TOPLEFT" }, "text": "table-structure. These OTSL features are illustrated in Figure 1, in comparison", "orig": "table-structure. These OTSL features are illustrated in Figure 1, in comparison", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 21, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 134.8, "r_y0": 331.2, "r_x1": 179.7, "r_y1": 331.2, "r_x2": 179.7, "r_y2": 322.4, "r_x3": 134.8, "r_y3": 322.4, "coord_origin": "TOPLEFT" }, "text": "to HTML.", "orig": "to HTML.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 0, "label": "text", "bbox": { "l": 134.8, "t": 334.6, "r": 480.6, "b": 439.1, "coord_origin": "TOPLEFT" }, "confidence": 0.99, "cells": [ { "index": 22, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 149.7, "r_y0": 343.4, "r_x1": 480.6, "r_y1": 343.4, "r_x2": 480.6, "r_y2": 334.6, "r_x3": 149.7, "r_y3": 334.6, "coord_origin": "TOPLEFT" }, "text": "The paper is structured as follows. In section 2, we give an overview of the", "orig": "The paper is structured as follows. In section 2, we give an overview of the", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 23, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 134.8, "r_y0": 355.4, "r_x1": 480.6, "r_y1": 355.4, "r_x2": 480.6, "r_y2": 346.6, "r_x3": 134.8, "r_y3": 346.6, "coord_origin": "TOPLEFT" }, "text": "latest developments in table-structure reconstruction. In section 3 we review", "orig": "latest developments in table-structure reconstruction. In section 3 we review", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 24, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 134.8, "r_y0": 367.4, "r_x1": 480.6, "r_y1": 367.4, "r_x2": 480.6, "r_y2": 358.6, "r_x3": 134.8, "r_y3": 358.6, "coord_origin": "TOPLEFT" }, "text": "the current HTML table encoding (popularised by PubTabNet and FinTabNet)", "orig": "the current HTML table encoding (popularised by PubTabNet and FinTabNet)", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 25, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 134.8, "r_y0": 379.3, "r_x1": 480.6, "r_y1": 379.3, "r_x2": 480.6, "r_y2": 370.5, "r_x3": 134.8, "r_y3": 370.5, "coord_origin": "TOPLEFT" }, "text": "and discuss its flaws. Subsequently, we introduce OTSL in section 4, which in-", "orig": "and discuss its flaws. Subsequently, we introduce OTSL in section 4, which in-", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 26, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 134.8, "r_y0": 391.3, "r_x1": 480.6, "r_y1": 391.3, "r_x2": 480.6, "r_y2": 382.5, "r_x3": 134.8, "r_y3": 382.5, "coord_origin": "TOPLEFT" }, "text": "cludes the language definition, syntax rules and error-correction procedures. In", "orig": "cludes the language definition, syntax rules and error-correction procedures. In", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 27, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 134.8, "r_y0": 403.2, "r_x1": 480.6, "r_y1": 403.2, "r_x2": 480.6, "r_y2": 394.4, "r_x3": 134.8, "r_y3": 394.4, "coord_origin": "TOPLEFT" }, "text": "section 5, we apply OTSL on the TableFormer architecture, compare it to Table-", "orig": "section 5, we apply OTSL on the TableFormer architecture, compare it to Table-", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 28, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 134.8, "r_y0": 415.2, "r_x1": 480.6, "r_y1": 415.2, "r_x2": 480.6, "r_y2": 406.4, "r_x3": 134.8, "r_y3": 406.4, "coord_origin": "TOPLEFT" }, "text": "Former models trained on HTML and ultimately demonstrate the advantages", "orig": "Former models trained on HTML and ultimately demonstrate the advantages", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 29, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 134.8, "r_y0": 427.1, "r_x1": 480.6, "r_y1": 427.1, "r_x2": 480.6, "r_y2": 418.3, "r_x3": 134.8, "r_y3": 418.3, "coord_origin": "TOPLEFT" }, "text": "of using OTSL. Finally, in section 6 we conclude our work and outline next", "orig": "of using OTSL. Finally, in section 6 we conclude our work and outline next", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 30, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 134.8, "r_y0": 439.1, "r_x1": 201.3, "r_y1": 439.1, "r_x2": 201.3, "r_y2": 430.3, "r_x3": 134.8, "r_y3": 430.3, "coord_origin": "TOPLEFT" }, "text": "potential steps.", "orig": "potential steps.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 4, "label": "section_header", "bbox": { "l": 134.8, "t": 462.1, "r": 236.8, "b": 472.7, "coord_origin": "TOPLEFT" }, "confidence": 0.94, "cells": [ { "index": 31, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 134.8, "r_y0": 472.7, "r_x1": 141.5, "r_y1": 472.7, "r_x2": 141.5, "r_y2": 462.1, "r_x3": 134.8, "r_y3": 462.1, "coord_origin": "TOPLEFT" }, "text": "2", "orig": "2", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 32, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 154.9, "r_y0": 472.7, "r_x1": 236.8, "r_y1": 472.7, "r_x2": 236.8, "r_y2": 462.1, "r_x3": 154.9, "r_y3": 462.1, "coord_origin": "TOPLEFT" }, "text": "Related Work", "orig": "Related Work", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 3, "label": "text", "bbox": { "l": 134.8, "t": 488.7, "r": 484.1, "b": 664.9, "coord_origin": "TOPLEFT" }, "confidence": 0.99, "cells": [ { "index": 33, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 134.8, "r_y0": 497.5, "r_x1": 480.6, "r_y1": 497.5, "r_x2": 480.6, "r_y2": 488.7, "r_x3": 134.8, "r_y3": 488.7, "coord_origin": "TOPLEFT" }, "text": "Approaches to formalize the logical structure and layout of tables in electronic", "orig": "Approaches to formalize the logical structure and layout of tables in electronic", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 34, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 134.8, "r_y0": 509.4, "r_x1": 480.6, "r_y1": 509.4, "r_x2": 480.6, "r_y2": 500.6, "r_x3": 134.8, "r_y3": 500.6, "coord_origin": "TOPLEFT" }, "text": "documents date back more than two decades [16]. In the recent past, a wide", "orig": "documents date back more than two decades [16]. In the recent past, a wide", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 35, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 134.8, "r_y0": 521.4, "r_x1": 480.6, "r_y1": 521.4, "r_x2": 480.6, "r_y2": 512.6, "r_x3": 134.8, "r_y3": 512.6, "coord_origin": "TOPLEFT" }, "text": "variety of computer vision methods have been explored to tackle the prob-", "orig": "variety of computer vision methods have been explored to tackle the prob-", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 36, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 134.8, "r_y0": 533.3, "r_x1": 480.6, "r_y1": 533.3, "r_x2": 480.6, "r_y2": 524.6, "r_x3": 134.8, "r_y3": 524.6, "coord_origin": "TOPLEFT" }, "text": "lem of table structure recognition, i.e. the correct identification of columns,", "orig": "lem of table structure recognition, i.e. the correct identification of columns,", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 37, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 134.8, "r_y0": 545.3, "r_x1": 480.6, "r_y1": 545.3, "r_x2": 480.6, "r_y2": 536.5, "r_x3": 134.8, "r_y3": 536.5, "coord_origin": "TOPLEFT" }, "text": "rows and spanning cells in a given table. Broadly speaking, the current deep-", "orig": "rows and spanning cells in a given table. Broadly speaking, the current deep-", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 38, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 134.8, "r_y0": 557.3, "r_x1": 480.6, "r_y1": 557.3, "r_x2": 480.6, "r_y2": 548.5, "r_x3": 134.8, "r_y3": 548.5, "coord_origin": "TOPLEFT" }, "text": "learning based approaches fall into three categories: object detection (OD) meth-", "orig": "learning based approaches fall into three categories: object detection (OD) meth-", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 39, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 134.8, "r_y0": 569.2, "r_x1": 480.6, "r_y1": 569.2, "r_x2": 480.6, "r_y2": 560.4, "r_x3": 134.8, "r_y3": 560.4, "coord_origin": "TOPLEFT" }, "text": "ods, Graph-Neural-Network (GNN) methods and Image-to-Markup-Sequence", "orig": "ods, Graph-Neural-Network (GNN) methods and Image-to-Markup-Sequence", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 40, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 134.8, "r_y0": 581.2, "r_x1": 484.1, "r_y1": 581.2, "r_x2": 484.1, "r_y2": 572.4, "r_x3": 134.8, "r_y3": 572.4, "coord_origin": "TOPLEFT" }, "text": "(Im2Seq) methods. Object-detection based methods [11,12,13,14,21] rely on table-", "orig": "(Im2Seq) methods. Object-detection based methods [11,12,13,14,21] rely on table-", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 41, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 134.8, "r_y0": 593.1, "r_x1": 480.6, "r_y1": 593.1, "r_x2": 480.6, "r_y2": 584.3, "r_x3": 134.8, "r_y3": 584.3, "coord_origin": "TOPLEFT" }, "text": "structure annotation using (overlapping) bounding boxes for training, and pro-", "orig": "structure annotation using (overlapping) bounding boxes for training, and pro-", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 42, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 134.8, "r_y0": 605.1, "r_x1": 480.6, "r_y1": 605.1, "r_x2": 480.6, "r_y2": 596.3, "r_x3": 134.8, "r_y3": 596.3, "coord_origin": "TOPLEFT" }, "text": "duce bounding-box predictions to define table cells, rows, and columns on a table", "orig": "duce bounding-box predictions to define table cells, rows, and columns on a table", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 43, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 134.8, "r_y0": 617.0, "r_x1": 480.6, "r_y1": 617.0, "r_x2": 480.6, "r_y2": 608.2, "r_x3": 134.8, "r_y3": 608.2, "coord_origin": "TOPLEFT" }, "text": "image. Graph Neural Network (GNN) based methods [3,6,17,18], as the name", "orig": "image. Graph Neural Network (GNN) based methods [3,6,17,18], as the name", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 44, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 134.8, "r_y0": 629.0, "r_x1": 480.6, "r_y1": 629.0, "r_x2": 480.6, "r_y2": 620.2, "r_x3": 134.8, "r_y3": 620.2, "coord_origin": "TOPLEFT" }, "text": "suggests, represent tables as graph structures. The graph nodes represent the", "orig": "suggests, represent tables as graph structures. The graph nodes represent the", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 45, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 134.8, "r_y0": 640.9, "r_x1": 480.6, "r_y1": 640.9, "r_x2": 480.6, "r_y2": 632.1, "r_x3": 134.8, "r_y3": 632.1, "coord_origin": "TOPLEFT" }, "text": "content of each table cell, an embedding vector from the table image, or geomet-", "orig": "content of each table cell, an embedding vector from the table image, or geomet-", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 46, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 134.8, "r_y0": 652.9, "r_x1": 480.6, "r_y1": 652.9, "r_x2": 480.6, "r_y2": 644.1, "r_x3": 134.8, "r_y3": 644.1, "coord_origin": "TOPLEFT" }, "text": "ric coordinates of the table cell. The edges of the graph define the relationship", "orig": "ric coordinates of the table cell. The edges of the graph define the relationship", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 47, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 134.8, "r_y0": 664.9, "r_x1": 480.6, "r_y1": 664.9, "r_x2": 480.6, "r_y2": 656.1, "r_x3": 134.8, "r_y3": 656.1, "coord_origin": "TOPLEFT" }, "text": "between the nodes, e.g. if they belong to the same column, row, or table cell.", "orig": "between the nodes, e.g. if they belong to the same column, row, or table cell.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] } ] }, "tablestructure": { "table_map": {} }, "figures_classification": null, "equations_prediction": null, "vlm_response": null }, "assembled": { "elements": [ { "label": "page_header", "id": 5, "page_no": 2, "cluster": { "id": 5, "label": "page_header", "bbox": { "l": 194.5, "t": 93.8, "r": 447.5, "b": 101.8, "coord_origin": "TOPLEFT" }, "confidence": 0.93, "cells": [ { "index": 0, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 194.5, "r_y0": 101.8, "r_x1": 447.5, "r_y1": 101.8, "r_x2": 447.5, "r_y2": 93.8, "r_x3": 194.5, "r_y3": 93.8, "coord_origin": "TOPLEFT" }, "text": "Optimized Table Tokenization for Table Structure Recognition", "orig": "Optimized Table Tokenization for Table Structure Recognition", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, "text": "Optimized Table Tokenization for Table Structure Recognition" }, { "label": "page_header", "id": 6, "page_no": 2, "cluster": { "id": 6, "label": "page_header", "bbox": { "l": 476.0, "t": 93.8, "r": 480.6, "b": 101.8, "coord_origin": "TOPLEFT" }, "confidence": 0.88, "cells": [ { "index": 1, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 476.0, "r_y0": 101.8, "r_x1": 480.6, "r_y1": 101.8, "r_x2": 480.6, "r_y2": 93.8, "r_x3": 476.0, "r_y3": 93.8, "coord_origin": "TOPLEFT" }, "text": "3", "orig": "3", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, "text": "3" }, { "label": "text", "id": 2, "page_no": 2, "cluster": { "id": 2, "label": "text", "bbox": { "l": 134.8, "t": 118.9, "r": 480.6, "b": 211.4, "coord_origin": "TOPLEFT" }, "confidence": 0.99, "cells": [ { "index": 2, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 149.7, "r_y0": 127.7, "r_x1": 480.6, "r_y1": 127.7, "r_x2": 480.6, "r_y2": 118.9, "r_x3": 149.7, "r_y3": 118.9, "coord_origin": "TOPLEFT" }, "text": "While the majority of research in TSR is currently focused on the develop-", "orig": "While the majority of research in TSR is currently focused on the develop-", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 3, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 134.8, "r_y0": 139.7, "r_x1": 480.6, "r_y1": 139.7, "r_x2": 480.6, "r_y2": 130.9, "r_x3": 134.8, "r_y3": 130.9, "coord_origin": "TOPLEFT" }, "text": "ment and application of novel neural model architectures, the table structure", "orig": "ment and application of novel neural model architectures, the table structure", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 4, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 134.8, "r_y0": 151.6, "r_x1": 480.6, "r_y1": 151.6, "r_x2": 480.6, "r_y2": 142.8, "r_x3": 134.8, "r_y3": 142.8, "coord_origin": "TOPLEFT" }, "text": "representation language (e.g. HTML in PubTabNet and FinTabNet) is usually", "orig": "representation language (e.g. HTML in PubTabNet and FinTabNet) is usually", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 5, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 134.8, "r_y0": 163.6, "r_x1": 169.6, "r_y1": 163.6, "r_x2": 169.6, "r_y2": 154.8, "r_x3": 134.8, "r_y3": 154.8, "coord_origin": "TOPLEFT" }, "text": "adopted", "orig": "adopted", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 6, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 173.9, "r_y0": 163.6, "r_x1": 194.6, "r_y1": 163.6, "r_x2": 194.6, "r_y2": 154.8, "r_x3": 173.9, "r_y3": 154.8, "coord_origin": "TOPLEFT" }, "text": "as is", "orig": "as is", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 7, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 199.6, "r_y0": 163.6, "r_x1": 480.6, "r_y1": 163.6, "r_x2": 480.6, "r_y2": 154.8, "r_x3": 199.6, "r_y3": 154.8, "coord_origin": "TOPLEFT" }, "text": "for the sequence tokenization in Im2Seq models. In this paper,", "orig": "for the sequence tokenization in Im2Seq models. In this paper,", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 8, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 134.8, "r_y0": 175.6, "r_x1": 480.6, "r_y1": 175.6, "r_x2": 480.6, "r_y2": 166.8, "r_x3": 134.8, "r_y3": 166.8, "coord_origin": "TOPLEFT" }, "text": "we aim for the opposite and investigate the impact of the table structure rep-", "orig": "we aim for the opposite and investigate the impact of the table structure rep-", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 9, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 134.8, "r_y0": 187.5, "r_x1": 480.6, "r_y1": 187.5, "r_x2": 480.6, "r_y2": 178.7, "r_x3": 134.8, "r_y3": 178.7, "coord_origin": "TOPLEFT" }, "text": "resentation language with an otherwise unmodified Im2Seq transformer-based", "orig": "resentation language with an otherwise unmodified Im2Seq transformer-based", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 10, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 134.8, "r_y0": 199.5, "r_x1": 480.6, "r_y1": 199.5, "r_x2": 480.6, "r_y2": 190.7, "r_x3": 134.8, "r_y3": 190.7, "coord_origin": "TOPLEFT" }, "text": "architecture. Since the current state-of-the-art Im2Seq model is TableFormer [9],", "orig": "architecture. Since the current state-of-the-art Im2Seq model is TableFormer [9],", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 11, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 134.8, "r_y0": 211.4, "r_x1": 348.4, "r_y1": 211.4, "r_x2": 348.4, "r_y2": 202.6, "r_x3": 134.8, "r_y3": 202.6, "coord_origin": "TOPLEFT" }, "text": "we select this model to perform our experiments.", "orig": "we select this model to perform our experiments.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, "text": "While the majority of research in TSR is currently focused on the development and application of novel neural model architectures, the table structure representation language (e.g. HTML in PubTabNet and FinTabNet) is usually adopted as is for the sequence tokenization in Im2Seq models. In this paper, we aim for the opposite and investigate the impact of the table structure representation language with an otherwise unmodified Im2Seq transformer-based architecture. Since the current state-of-the-art Im2Seq model is TableFormer [9], we select this model to perform our experiments." }, { "label": "text", "id": 1, "page_no": 2, "cluster": { "id": 1, "label": "text", "bbox": { "l": 134.8, "t": 214.8, "r": 480.6, "b": 331.2, "coord_origin": "TOPLEFT" }, "confidence": 0.99, "cells": [ { "index": 12, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 149.7, "r_y0": 223.6, "r_x1": 480.6, "r_y1": 223.6, "r_x2": 480.6, "r_y2": 214.8, "r_x3": 149.7, "r_y3": 214.8, "coord_origin": "TOPLEFT" }, "text": "The main contribution of this paper is the introduction of a new optimised ta-", "orig": "The main contribution of this paper is the introduction of a new optimised ta-", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 13, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 134.8, "r_y0": 235.6, "r_x1": 480.6, "r_y1": 235.6, "r_x2": 480.6, "r_y2": 226.8, "r_x3": 134.8, "r_y3": 226.8, "coord_origin": "TOPLEFT" }, "text": "ble structure language (OTSL), specifically designed to describe table-structure", "orig": "ble structure language (OTSL), specifically designed to describe table-structure", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 14, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 134.8, "r_y0": 247.5, "r_x1": 480.6, "r_y1": 247.5, "r_x2": 480.6, "r_y2": 238.7, "r_x3": 134.8, "r_y3": 238.7, "coord_origin": "TOPLEFT" }, "text": "in an compact and structured way for Im2Seq models. OTSL has a number of", "orig": "in an compact and structured way for Im2Seq models. OTSL has a number of", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 15, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 134.8, "r_y0": 259.5, "r_x1": 480.6, "r_y1": 259.5, "r_x2": 480.6, "r_y2": 250.7, "r_x3": 134.8, "r_y3": 250.7, "coord_origin": "TOPLEFT" }, "text": "key features, which make it very attractive to use in Im2Seq models. Specifically,", "orig": "key features, which make it very attractive to use in Im2Seq models. Specifically,", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 16, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 134.8, "r_y0": 271.5, "r_x1": 480.6, "r_y1": 271.5, "r_x2": 480.6, "r_y2": 262.7, "r_x3": 134.8, "r_y3": 262.7, "coord_origin": "TOPLEFT" }, "text": "compared to other languages such as HTML, OTSL has a minimized vocabulary", "orig": "compared to other languages such as HTML, OTSL has a minimized vocabulary", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 17, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 134.8, "r_y0": 283.4, "r_x1": 480.6, "r_y1": 283.4, "r_x2": 480.6, "r_y2": 274.6, "r_x3": 134.8, "r_y3": 274.6, "coord_origin": "TOPLEFT" }, "text": "which yields short sequence length, strong inherent structure (e.g. strict rectan-", "orig": "which yields short sequence length, strong inherent structure (e.g. strict rectan-", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 18, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 134.8, "r_y0": 295.4, "r_x1": 480.6, "r_y1": 295.4, "r_x2": 480.6, "r_y2": 286.6, "r_x3": 134.8, "r_y3": 286.6, "coord_origin": "TOPLEFT" }, "text": "gular layout) and a strict syntax with rules that only look backwards. The latter", "orig": "gular layout) and a strict syntax with rules that only look backwards. The latter", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 19, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 134.8, "r_y0": 307.3, "r_x1": 480.6, "r_y1": 307.3, "r_x2": 480.6, "r_y2": 298.5, "r_x3": 134.8, "r_y3": 298.5, "coord_origin": "TOPLEFT" }, "text": "allows for syntax validation during inference and ensures a syntactically correct", "orig": "allows for syntax validation during inference and ensures a syntactically correct", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 20, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 134.8, "r_y0": 319.3, "r_x1": 480.6, "r_y1": 319.3, "r_x2": 480.6, "r_y2": 310.5, "r_x3": 134.8, "r_y3": 310.5, "coord_origin": "TOPLEFT" }, "text": "table-structure. These OTSL features are illustrated in Figure 1, in comparison", "orig": "table-structure. These OTSL features are illustrated in Figure 1, in comparison", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 21, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 134.8, "r_y0": 331.2, "r_x1": 179.7, "r_y1": 331.2, "r_x2": 179.7, "r_y2": 322.4, "r_x3": 134.8, "r_y3": 322.4, "coord_origin": "TOPLEFT" }, "text": "to HTML.", "orig": "to HTML.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, "text": "The main contribution of this paper is the introduction of a new optimised table structure language (OTSL), specifically designed to describe table-structure in an compact and structured way for Im2Seq models. OTSL has a number of key features, which make it very attractive to use in Im2Seq models. Specifically, compared to other languages such as HTML, OTSL has a minimized vocabulary which yields short sequence length, strong inherent structure (e.g. strict rectangular layout) and a strict syntax with rules that only look backwards. The latter allows for syntax validation during inference and ensures a syntactically correct table-structure. These OTSL features are illustrated in Figure 1, in comparison to HTML." }, { "label": "text", "id": 0, "page_no": 2, "cluster": { "id": 0, "label": "text", "bbox": { "l": 134.8, "t": 334.6, "r": 480.6, "b": 439.1, "coord_origin": "TOPLEFT" }, "confidence": 0.99, "cells": [ { "index": 22, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 149.7, "r_y0": 343.4, "r_x1": 480.6, "r_y1": 343.4, "r_x2": 480.6, "r_y2": 334.6, "r_x3": 149.7, "r_y3": 334.6, "coord_origin": "TOPLEFT" }, "text": "The paper is structured as follows. In section 2, we give an overview of the", "orig": "The paper is structured as follows. In section 2, we give an overview of the", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 23, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 134.8, "r_y0": 355.4, "r_x1": 480.6, "r_y1": 355.4, "r_x2": 480.6, "r_y2": 346.6, "r_x3": 134.8, "r_y3": 346.6, "coord_origin": "TOPLEFT" }, "text": "latest developments in table-structure reconstruction. In section 3 we review", "orig": "latest developments in table-structure reconstruction. In section 3 we review", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 24, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 134.8, "r_y0": 367.4, "r_x1": 480.6, "r_y1": 367.4, "r_x2": 480.6, "r_y2": 358.6, "r_x3": 134.8, "r_y3": 358.6, "coord_origin": "TOPLEFT" }, "text": "the current HTML table encoding (popularised by PubTabNet and FinTabNet)", "orig": "the current HTML table encoding (popularised by PubTabNet and FinTabNet)", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 25, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 134.8, "r_y0": 379.3, "r_x1": 480.6, "r_y1": 379.3, "r_x2": 480.6, "r_y2": 370.5, "r_x3": 134.8, "r_y3": 370.5, "coord_origin": "TOPLEFT" }, "text": "and discuss its flaws. Subsequently, we introduce OTSL in section 4, which in-", "orig": "and discuss its flaws. Subsequently, we introduce OTSL in section 4, which in-", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 26, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 134.8, "r_y0": 391.3, "r_x1": 480.6, "r_y1": 391.3, "r_x2": 480.6, "r_y2": 382.5, "r_x3": 134.8, "r_y3": 382.5, "coord_origin": "TOPLEFT" }, "text": "cludes the language definition, syntax rules and error-correction procedures. In", "orig": "cludes the language definition, syntax rules and error-correction procedures. In", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 27, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 134.8, "r_y0": 403.2, "r_x1": 480.6, "r_y1": 403.2, "r_x2": 480.6, "r_y2": 394.4, "r_x3": 134.8, "r_y3": 394.4, "coord_origin": "TOPLEFT" }, "text": "section 5, we apply OTSL on the TableFormer architecture, compare it to Table-", "orig": "section 5, we apply OTSL on the TableFormer architecture, compare it to Table-", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 28, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 134.8, "r_y0": 415.2, "r_x1": 480.6, "r_y1": 415.2, "r_x2": 480.6, "r_y2": 406.4, "r_x3": 134.8, "r_y3": 406.4, "coord_origin": "TOPLEFT" }, "text": "Former models trained on HTML and ultimately demonstrate the advantages", "orig": "Former models trained on HTML and ultimately demonstrate the advantages", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 29, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 134.8, "r_y0": 427.1, "r_x1": 480.6, "r_y1": 427.1, "r_x2": 480.6, "r_y2": 418.3, "r_x3": 134.8, "r_y3": 418.3, "coord_origin": "TOPLEFT" }, "text": "of using OTSL. Finally, in section 6 we conclude our work and outline next", "orig": "of using OTSL. Finally, in section 6 we conclude our work and outline next", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 30, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 134.8, "r_y0": 439.1, "r_x1": 201.3, "r_y1": 439.1, "r_x2": 201.3, "r_y2": 430.3, "r_x3": 134.8, "r_y3": 430.3, "coord_origin": "TOPLEFT" }, "text": "potential steps.", "orig": "potential steps.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, "text": "The paper is structured as follows. In section 2, we give an overview of the latest developments in table-structure reconstruction. In section 3 we review the current HTML table encoding (popularised by PubTabNet and FinTabNet) and discuss its flaws. Subsequently, we introduce OTSL in section 4, which includes the language definition, syntax rules and error-correction procedures. In section 5, we apply OTSL on the TableFormer architecture, compare it to TableFormer models trained on HTML and ultimately demonstrate the advantages of using OTSL. Finally, in section 6 we conclude our work and outline next potential steps." }, { "label": "section_header", "id": 4, "page_no": 2, "cluster": { "id": 4, "label": "section_header", "bbox": { "l": 134.8, "t": 462.1, "r": 236.8, "b": 472.7, "coord_origin": "TOPLEFT" }, "confidence": 0.94, "cells": [ { "index": 31, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 134.8, "r_y0": 472.7, "r_x1": 141.5, "r_y1": 472.7, "r_x2": 141.5, "r_y2": 462.1, "r_x3": 134.8, "r_y3": 462.1, "coord_origin": "TOPLEFT" }, "text": "2", "orig": "2", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 32, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 154.9, "r_y0": 472.7, "r_x1": 236.8, "r_y1": 472.7, "r_x2": 236.8, "r_y2": 462.1, "r_x3": 154.9, "r_y3": 462.1, "coord_origin": "TOPLEFT" }, "text": "Related Work", "orig": "Related Work", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, "text": "2 Related Work" }, { "label": "text", "id": 3, "page_no": 2, "cluster": { "id": 3, "label": "text", "bbox": { "l": 134.8, "t": 488.7, "r": 484.1, "b": 664.9, "coord_origin": "TOPLEFT" }, "confidence": 0.99, "cells": [ { "index": 33, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 134.8, "r_y0": 497.5, "r_x1": 480.6, "r_y1": 497.5, "r_x2": 480.6, "r_y2": 488.7, "r_x3": 134.8, "r_y3": 488.7, "coord_origin": "TOPLEFT" }, "text": "Approaches to formalize the logical structure and layout of tables in electronic", "orig": "Approaches to formalize the logical structure and layout of tables in electronic", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 34, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 134.8, "r_y0": 509.4, "r_x1": 480.6, "r_y1": 509.4, "r_x2": 480.6, "r_y2": 500.6, "r_x3": 134.8, "r_y3": 500.6, "coord_origin": "TOPLEFT" }, "text": "documents date back more than two decades [16]. In the recent past, a wide", "orig": "documents date back more than two decades [16]. In the recent past, a wide", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 35, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 134.8, "r_y0": 521.4, "r_x1": 480.6, "r_y1": 521.4, "r_x2": 480.6, "r_y2": 512.6, "r_x3": 134.8, "r_y3": 512.6, "coord_origin": "TOPLEFT" }, "text": "variety of computer vision methods have been explored to tackle the prob-", "orig": "variety of computer vision methods have been explored to tackle the prob-", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 36, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 134.8, "r_y0": 533.3, "r_x1": 480.6, "r_y1": 533.3, "r_x2": 480.6, "r_y2": 524.6, "r_x3": 134.8, "r_y3": 524.6, "coord_origin": "TOPLEFT" }, "text": "lem of table structure recognition, i.e. the correct identification of columns,", "orig": "lem of table structure recognition, i.e. the correct identification of columns,", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 37, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 134.8, "r_y0": 545.3, "r_x1": 480.6, "r_y1": 545.3, "r_x2": 480.6, "r_y2": 536.5, "r_x3": 134.8, "r_y3": 536.5, "coord_origin": "TOPLEFT" }, "text": "rows and spanning cells in a given table. Broadly speaking, the current deep-", "orig": "rows and spanning cells in a given table. Broadly speaking, the current deep-", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 38, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 134.8, "r_y0": 557.3, "r_x1": 480.6, "r_y1": 557.3, "r_x2": 480.6, "r_y2": 548.5, "r_x3": 134.8, "r_y3": 548.5, "coord_origin": "TOPLEFT" }, "text": "learning based approaches fall into three categories: object detection (OD) meth-", "orig": "learning based approaches fall into three categories: object detection (OD) meth-", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 39, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 134.8, "r_y0": 569.2, "r_x1": 480.6, "r_y1": 569.2, "r_x2": 480.6, "r_y2": 560.4, "r_x3": 134.8, "r_y3": 560.4, "coord_origin": "TOPLEFT" }, "text": "ods, Graph-Neural-Network (GNN) methods and Image-to-Markup-Sequence", "orig": "ods, Graph-Neural-Network (GNN) methods and Image-to-Markup-Sequence", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 40, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 134.8, "r_y0": 581.2, "r_x1": 484.1, "r_y1": 581.2, "r_x2": 484.1, "r_y2": 572.4, "r_x3": 134.8, "r_y3": 572.4, "coord_origin": "TOPLEFT" }, "text": "(Im2Seq) methods. Object-detection based methods [11,12,13,14,21] rely on table-", "orig": "(Im2Seq) methods. Object-detection based methods [11,12,13,14,21] rely on table-", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 41, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 134.8, "r_y0": 593.1, "r_x1": 480.6, "r_y1": 593.1, "r_x2": 480.6, "r_y2": 584.3, "r_x3": 134.8, "r_y3": 584.3, "coord_origin": "TOPLEFT" }, "text": "structure annotation using (overlapping) bounding boxes for training, and pro-", "orig": "structure annotation using (overlapping) bounding boxes for training, and pro-", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 42, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 134.8, "r_y0": 605.1, "r_x1": 480.6, "r_y1": 605.1, "r_x2": 480.6, "r_y2": 596.3, "r_x3": 134.8, "r_y3": 596.3, "coord_origin": "TOPLEFT" }, "text": "duce bounding-box predictions to define table cells, rows, and columns on a table", "orig": "duce bounding-box predictions to define table cells, rows, and columns on a table", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 43, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 134.8, "r_y0": 617.0, "r_x1": 480.6, "r_y1": 617.0, "r_x2": 480.6, "r_y2": 608.2, "r_x3": 134.8, "r_y3": 608.2, "coord_origin": "TOPLEFT" }, "text": "image. Graph Neural Network (GNN) based methods [3,6,17,18], as the name", "orig": "image. Graph Neural Network (GNN) based methods [3,6,17,18], as the name", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 44, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 134.8, "r_y0": 629.0, "r_x1": 480.6, "r_y1": 629.0, "r_x2": 480.6, "r_y2": 620.2, "r_x3": 134.8, "r_y3": 620.2, "coord_origin": "TOPLEFT" }, "text": "suggests, represent tables as graph structures. The graph nodes represent the", "orig": "suggests, represent tables as graph structures. The graph nodes represent the", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 45, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 134.8, "r_y0": 640.9, "r_x1": 480.6, "r_y1": 640.9, "r_x2": 480.6, "r_y2": 632.1, "r_x3": 134.8, "r_y3": 632.1, "coord_origin": "TOPLEFT" }, "text": "content of each table cell, an embedding vector from the table image, or geomet-", "orig": "content of each table cell, an embedding vector from the table image, or geomet-", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 46, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 134.8, "r_y0": 652.9, "r_x1": 480.6, "r_y1": 652.9, "r_x2": 480.6, "r_y2": 644.1, "r_x3": 134.8, "r_y3": 644.1, "coord_origin": "TOPLEFT" }, "text": "ric coordinates of the table cell. The edges of the graph define the relationship", "orig": "ric coordinates of the table cell. The edges of the graph define the relationship", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 47, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 134.8, "r_y0": 664.9, "r_x1": 480.6, "r_y1": 664.9, "r_x2": 480.6, "r_y2": 656.1, "r_x3": 134.8, "r_y3": 656.1, "coord_origin": "TOPLEFT" }, "text": "between the nodes, e.g. if they belong to the same column, row, or table cell.", "orig": "between the nodes, e.g. if they belong to the same column, row, or table cell.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, "text": "Approaches to formalize the logical structure and layout of tables in electronic documents date back more than two decades [16]. In the recent past, a wide variety of computer vision methods have been explored to tackle the problem of table structure recognition, i.e. the correct identification of columns, rows and spanning cells in a given table. Broadly speaking, the current deeplearning based approaches fall into three categories: object detection (OD) methods, Graph-Neural-Network (GNN) methods and Image-to-Markup-Sequence (Im2Seq) methods. Object-detection based methods [11,12,13,14,21] rely on tablestructure annotation using (overlapping) bounding boxes for training, and produce bounding-box predictions to define table cells, rows, and columns on a table image. Graph Neural Network (GNN) based methods [3,6,17,18], as the name suggests, represent tables as graph structures. The graph nodes represent the content of each table cell, an embedding vector from the table image, or geometric coordinates of the table cell. The edges of the graph define the relationship between the nodes, e.g. if they belong to the same column, row, or table cell." } ], "body": [ { "label": "text", "id": 2, "page_no": 2, "cluster": { "id": 2, "label": "text", "bbox": { "l": 134.8, "t": 118.9, "r": 480.6, "b": 211.4, "coord_origin": "TOPLEFT" }, "confidence": 0.99, "cells": [ { "index": 2, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 149.7, "r_y0": 127.7, "r_x1": 480.6, "r_y1": 127.7, "r_x2": 480.6, "r_y2": 118.9, "r_x3": 149.7, "r_y3": 118.9, "coord_origin": "TOPLEFT" }, "text": "While the majority of research in TSR is currently focused on the develop-", "orig": "While the majority of research in TSR is currently focused on the develop-", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 3, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 134.8, "r_y0": 139.7, "r_x1": 480.6, "r_y1": 139.7, "r_x2": 480.6, "r_y2": 130.9, "r_x3": 134.8, "r_y3": 130.9, "coord_origin": "TOPLEFT" }, "text": "ment and application of novel neural model architectures, the table structure", "orig": "ment and application of novel neural model architectures, the table structure", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 4, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 134.8, "r_y0": 151.6, "r_x1": 480.6, "r_y1": 151.6, "r_x2": 480.6, "r_y2": 142.8, "r_x3": 134.8, "r_y3": 142.8, "coord_origin": "TOPLEFT" }, "text": "representation language (e.g. HTML in PubTabNet and FinTabNet) is usually", "orig": "representation language (e.g. HTML in PubTabNet and FinTabNet) is usually", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 5, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 134.8, "r_y0": 163.6, "r_x1": 169.6, "r_y1": 163.6, "r_x2": 169.6, "r_y2": 154.8, "r_x3": 134.8, "r_y3": 154.8, "coord_origin": "TOPLEFT" }, "text": "adopted", "orig": "adopted", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 6, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 173.9, "r_y0": 163.6, "r_x1": 194.6, "r_y1": 163.6, "r_x2": 194.6, "r_y2": 154.8, "r_x3": 173.9, "r_y3": 154.8, "coord_origin": "TOPLEFT" }, "text": "as is", "orig": "as is", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 7, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 199.6, "r_y0": 163.6, "r_x1": 480.6, "r_y1": 163.6, "r_x2": 480.6, "r_y2": 154.8, "r_x3": 199.6, "r_y3": 154.8, "coord_origin": "TOPLEFT" }, "text": "for the sequence tokenization in Im2Seq models. In this paper,", "orig": "for the sequence tokenization in Im2Seq models. In this paper,", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 8, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 134.8, "r_y0": 175.6, "r_x1": 480.6, "r_y1": 175.6, "r_x2": 480.6, "r_y2": 166.8, "r_x3": 134.8, "r_y3": 166.8, "coord_origin": "TOPLEFT" }, "text": "we aim for the opposite and investigate the impact of the table structure rep-", "orig": "we aim for the opposite and investigate the impact of the table structure rep-", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 9, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 134.8, "r_y0": 187.5, "r_x1": 480.6, "r_y1": 187.5, "r_x2": 480.6, "r_y2": 178.7, "r_x3": 134.8, "r_y3": 178.7, "coord_origin": "TOPLEFT" }, "text": "resentation language with an otherwise unmodified Im2Seq transformer-based", "orig": "resentation language with an otherwise unmodified Im2Seq transformer-based", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 10, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 134.8, "r_y0": 199.5, "r_x1": 480.6, "r_y1": 199.5, "r_x2": 480.6, "r_y2": 190.7, "r_x3": 134.8, "r_y3": 190.7, "coord_origin": "TOPLEFT" }, "text": "architecture. Since the current state-of-the-art Im2Seq model is TableFormer [9],", "orig": "architecture. Since the current state-of-the-art Im2Seq model is TableFormer [9],", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 11, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 134.8, "r_y0": 211.4, "r_x1": 348.4, "r_y1": 211.4, "r_x2": 348.4, "r_y2": 202.6, "r_x3": 134.8, "r_y3": 202.6, "coord_origin": "TOPLEFT" }, "text": "we select this model to perform our experiments.", "orig": "we select this model to perform our experiments.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, "text": "While the majority of research in TSR is currently focused on the development and application of novel neural model architectures, the table structure representation language (e.g. HTML in PubTabNet and FinTabNet) is usually adopted as is for the sequence tokenization in Im2Seq models. In this paper, we aim for the opposite and investigate the impact of the table structure representation language with an otherwise unmodified Im2Seq transformer-based architecture. Since the current state-of-the-art Im2Seq model is TableFormer [9], we select this model to perform our experiments." }, { "label": "text", "id": 1, "page_no": 2, "cluster": { "id": 1, "label": "text", "bbox": { "l": 134.8, "t": 214.8, "r": 480.6, "b": 331.2, "coord_origin": "TOPLEFT" }, "confidence": 0.99, "cells": [ { "index": 12, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 149.7, "r_y0": 223.6, "r_x1": 480.6, "r_y1": 223.6, "r_x2": 480.6, "r_y2": 214.8, "r_x3": 149.7, "r_y3": 214.8, "coord_origin": "TOPLEFT" }, "text": "The main contribution of this paper is the introduction of a new optimised ta-", "orig": "The main contribution of this paper is the introduction of a new optimised ta-", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 13, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 134.8, "r_y0": 235.6, "r_x1": 480.6, "r_y1": 235.6, "r_x2": 480.6, "r_y2": 226.8, "r_x3": 134.8, "r_y3": 226.8, "coord_origin": "TOPLEFT" }, "text": "ble structure language (OTSL), specifically designed to describe table-structure", "orig": "ble structure language (OTSL), specifically designed to describe table-structure", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 14, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 134.8, "r_y0": 247.5, "r_x1": 480.6, "r_y1": 247.5, "r_x2": 480.6, "r_y2": 238.7, "r_x3": 134.8, "r_y3": 238.7, "coord_origin": "TOPLEFT" }, "text": "in an compact and structured way for Im2Seq models. OTSL has a number of", "orig": "in an compact and structured way for Im2Seq models. OTSL has a number of", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 15, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 134.8, "r_y0": 259.5, "r_x1": 480.6, "r_y1": 259.5, "r_x2": 480.6, "r_y2": 250.7, "r_x3": 134.8, "r_y3": 250.7, "coord_origin": "TOPLEFT" }, "text": "key features, which make it very attractive to use in Im2Seq models. Specifically,", "orig": "key features, which make it very attractive to use in Im2Seq models. Specifically,", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 16, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 134.8, "r_y0": 271.5, "r_x1": 480.6, "r_y1": 271.5, "r_x2": 480.6, "r_y2": 262.7, "r_x3": 134.8, "r_y3": 262.7, "coord_origin": "TOPLEFT" }, "text": "compared to other languages such as HTML, OTSL has a minimized vocabulary", "orig": "compared to other languages such as HTML, OTSL has a minimized vocabulary", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 17, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 134.8, "r_y0": 283.4, "r_x1": 480.6, "r_y1": 283.4, "r_x2": 480.6, "r_y2": 274.6, "r_x3": 134.8, "r_y3": 274.6, "coord_origin": "TOPLEFT" }, "text": "which yields short sequence length, strong inherent structure (e.g. strict rectan-", "orig": "which yields short sequence length, strong inherent structure (e.g. strict rectan-", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 18, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 134.8, "r_y0": 295.4, "r_x1": 480.6, "r_y1": 295.4, "r_x2": 480.6, "r_y2": 286.6, "r_x3": 134.8, "r_y3": 286.6, "coord_origin": "TOPLEFT" }, "text": "gular layout) and a strict syntax with rules that only look backwards. The latter", "orig": "gular layout) and a strict syntax with rules that only look backwards. The latter", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 19, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 134.8, "r_y0": 307.3, "r_x1": 480.6, "r_y1": 307.3, "r_x2": 480.6, "r_y2": 298.5, "r_x3": 134.8, "r_y3": 298.5, "coord_origin": "TOPLEFT" }, "text": "allows for syntax validation during inference and ensures a syntactically correct", "orig": "allows for syntax validation during inference and ensures a syntactically correct", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 20, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 134.8, "r_y0": 319.3, "r_x1": 480.6, "r_y1": 319.3, "r_x2": 480.6, "r_y2": 310.5, "r_x3": 134.8, "r_y3": 310.5, "coord_origin": "TOPLEFT" }, "text": "table-structure. These OTSL features are illustrated in Figure 1, in comparison", "orig": "table-structure. These OTSL features are illustrated in Figure 1, in comparison", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 21, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 134.8, "r_y0": 331.2, "r_x1": 179.7, "r_y1": 331.2, "r_x2": 179.7, "r_y2": 322.4, "r_x3": 134.8, "r_y3": 322.4, "coord_origin": "TOPLEFT" }, "text": "to HTML.", "orig": "to HTML.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, "text": "The main contribution of this paper is the introduction of a new optimised table structure language (OTSL), specifically designed to describe table-structure in an compact and structured way for Im2Seq models. OTSL has a number of key features, which make it very attractive to use in Im2Seq models. Specifically, compared to other languages such as HTML, OTSL has a minimized vocabulary which yields short sequence length, strong inherent structure (e.g. strict rectangular layout) and a strict syntax with rules that only look backwards. The latter allows for syntax validation during inference and ensures a syntactically correct table-structure. These OTSL features are illustrated in Figure 1, in comparison to HTML." }, { "label": "text", "id": 0, "page_no": 2, "cluster": { "id": 0, "label": "text", "bbox": { "l": 134.8, "t": 334.6, "r": 480.6, "b": 439.1, "coord_origin": "TOPLEFT" }, "confidence": 0.99, "cells": [ { "index": 22, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 149.7, "r_y0": 343.4, "r_x1": 480.6, "r_y1": 343.4, "r_x2": 480.6, "r_y2": 334.6, "r_x3": 149.7, "r_y3": 334.6, "coord_origin": "TOPLEFT" }, "text": "The paper is structured as follows. In section 2, we give an overview of the", "orig": "The paper is structured as follows. In section 2, we give an overview of the", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 23, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 134.8, "r_y0": 355.4, "r_x1": 480.6, "r_y1": 355.4, "r_x2": 480.6, "r_y2": 346.6, "r_x3": 134.8, "r_y3": 346.6, "coord_origin": "TOPLEFT" }, "text": "latest developments in table-structure reconstruction. In section 3 we review", "orig": "latest developments in table-structure reconstruction. In section 3 we review", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 24, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 134.8, "r_y0": 367.4, "r_x1": 480.6, "r_y1": 367.4, "r_x2": 480.6, "r_y2": 358.6, "r_x3": 134.8, "r_y3": 358.6, "coord_origin": "TOPLEFT" }, "text": "the current HTML table encoding (popularised by PubTabNet and FinTabNet)", "orig": "the current HTML table encoding (popularised by PubTabNet and FinTabNet)", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 25, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 134.8, "r_y0": 379.3, "r_x1": 480.6, "r_y1": 379.3, "r_x2": 480.6, "r_y2": 370.5, "r_x3": 134.8, "r_y3": 370.5, "coord_origin": "TOPLEFT" }, "text": "and discuss its flaws. Subsequently, we introduce OTSL in section 4, which in-", "orig": "and discuss its flaws. Subsequently, we introduce OTSL in section 4, which in-", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 26, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 134.8, "r_y0": 391.3, "r_x1": 480.6, "r_y1": 391.3, "r_x2": 480.6, "r_y2": 382.5, "r_x3": 134.8, "r_y3": 382.5, "coord_origin": "TOPLEFT" }, "text": "cludes the language definition, syntax rules and error-correction procedures. In", "orig": "cludes the language definition, syntax rules and error-correction procedures. In", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 27, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 134.8, "r_y0": 403.2, "r_x1": 480.6, "r_y1": 403.2, "r_x2": 480.6, "r_y2": 394.4, "r_x3": 134.8, "r_y3": 394.4, "coord_origin": "TOPLEFT" }, "text": "section 5, we apply OTSL on the TableFormer architecture, compare it to Table-", "orig": "section 5, we apply OTSL on the TableFormer architecture, compare it to Table-", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 28, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 134.8, "r_y0": 415.2, "r_x1": 480.6, "r_y1": 415.2, "r_x2": 480.6, "r_y2": 406.4, "r_x3": 134.8, "r_y3": 406.4, "coord_origin": "TOPLEFT" }, "text": "Former models trained on HTML and ultimately demonstrate the advantages", "orig": "Former models trained on HTML and ultimately demonstrate the advantages", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 29, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 134.8, "r_y0": 427.1, "r_x1": 480.6, "r_y1": 427.1, "r_x2": 480.6, "r_y2": 418.3, "r_x3": 134.8, "r_y3": 418.3, "coord_origin": "TOPLEFT" }, "text": "of using OTSL. Finally, in section 6 we conclude our work and outline next", "orig": "of using OTSL. Finally, in section 6 we conclude our work and outline next", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 30, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 134.8, "r_y0": 439.1, "r_x1": 201.3, "r_y1": 439.1, "r_x2": 201.3, "r_y2": 430.3, "r_x3": 134.8, "r_y3": 430.3, "coord_origin": "TOPLEFT" }, "text": "potential steps.", "orig": "potential steps.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, "text": "The paper is structured as follows. In section 2, we give an overview of the latest developments in table-structure reconstruction. In section 3 we review the current HTML table encoding (popularised by PubTabNet and FinTabNet) and discuss its flaws. Subsequently, we introduce OTSL in section 4, which includes the language definition, syntax rules and error-correction procedures. In section 5, we apply OTSL on the TableFormer architecture, compare it to TableFormer models trained on HTML and ultimately demonstrate the advantages of using OTSL. Finally, in section 6 we conclude our work and outline next potential steps." }, { "label": "section_header", "id": 4, "page_no": 2, "cluster": { "id": 4, "label": "section_header", "bbox": { "l": 134.8, "t": 462.1, "r": 236.8, "b": 472.7, "coord_origin": "TOPLEFT" }, "confidence": 0.94, "cells": [ { "index": 31, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 134.8, "r_y0": 472.7, "r_x1": 141.5, "r_y1": 472.7, "r_x2": 141.5, "r_y2": 462.1, "r_x3": 134.8, "r_y3": 462.1, "coord_origin": "TOPLEFT" }, "text": "2", "orig": "2", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 32, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 154.9, "r_y0": 472.7, "r_x1": 236.8, "r_y1": 472.7, "r_x2": 236.8, "r_y2": 462.1, "r_x3": 154.9, "r_y3": 462.1, "coord_origin": "TOPLEFT" }, "text": "Related Work", "orig": "Related Work", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, "text": "2 Related Work" }, { "label": "text", "id": 3, "page_no": 2, "cluster": { "id": 3, "label": "text", "bbox": { "l": 134.8, "t": 488.7, "r": 484.1, "b": 664.9, "coord_origin": "TOPLEFT" }, "confidence": 0.99, "cells": [ { "index": 33, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 134.8, "r_y0": 497.5, "r_x1": 480.6, "r_y1": 497.5, "r_x2": 480.6, "r_y2": 488.7, "r_x3": 134.8, "r_y3": 488.7, "coord_origin": "TOPLEFT" }, "text": "Approaches to formalize the logical structure and layout of tables in electronic", "orig": "Approaches to formalize the logical structure and layout of tables in electronic", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 34, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 134.8, "r_y0": 509.4, "r_x1": 480.6, "r_y1": 509.4, "r_x2": 480.6, "r_y2": 500.6, "r_x3": 134.8, "r_y3": 500.6, "coord_origin": "TOPLEFT" }, "text": "documents date back more than two decades [16]. In the recent past, a wide", "orig": "documents date back more than two decades [16]. In the recent past, a wide", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 35, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 134.8, "r_y0": 521.4, "r_x1": 480.6, "r_y1": 521.4, "r_x2": 480.6, "r_y2": 512.6, "r_x3": 134.8, "r_y3": 512.6, "coord_origin": "TOPLEFT" }, "text": "variety of computer vision methods have been explored to tackle the prob-", "orig": "variety of computer vision methods have been explored to tackle the prob-", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 36, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 134.8, "r_y0": 533.3, "r_x1": 480.6, "r_y1": 533.3, "r_x2": 480.6, "r_y2": 524.6, "r_x3": 134.8, "r_y3": 524.6, "coord_origin": "TOPLEFT" }, "text": "lem of table structure recognition, i.e. the correct identification of columns,", "orig": "lem of table structure recognition, i.e. the correct identification of columns,", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 37, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 134.8, "r_y0": 545.3, "r_x1": 480.6, "r_y1": 545.3, "r_x2": 480.6, "r_y2": 536.5, "r_x3": 134.8, "r_y3": 536.5, "coord_origin": "TOPLEFT" }, "text": "rows and spanning cells in a given table. Broadly speaking, the current deep-", "orig": "rows and spanning cells in a given table. Broadly speaking, the current deep-", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 38, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 134.8, "r_y0": 557.3, "r_x1": 480.6, "r_y1": 557.3, "r_x2": 480.6, "r_y2": 548.5, "r_x3": 134.8, "r_y3": 548.5, "coord_origin": "TOPLEFT" }, "text": "learning based approaches fall into three categories: object detection (OD) meth-", "orig": "learning based approaches fall into three categories: object detection (OD) meth-", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 39, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 134.8, "r_y0": 569.2, "r_x1": 480.6, "r_y1": 569.2, "r_x2": 480.6, "r_y2": 560.4, "r_x3": 134.8, "r_y3": 560.4, "coord_origin": "TOPLEFT" }, "text": "ods, Graph-Neural-Network (GNN) methods and Image-to-Markup-Sequence", "orig": "ods, Graph-Neural-Network (GNN) methods and Image-to-Markup-Sequence", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 40, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 134.8, "r_y0": 581.2, "r_x1": 484.1, "r_y1": 581.2, "r_x2": 484.1, "r_y2": 572.4, "r_x3": 134.8, "r_y3": 572.4, "coord_origin": "TOPLEFT" }, "text": "(Im2Seq) methods. Object-detection based methods [11,12,13,14,21] rely on table-", "orig": "(Im2Seq) methods. Object-detection based methods [11,12,13,14,21] rely on table-", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 41, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 134.8, "r_y0": 593.1, "r_x1": 480.6, "r_y1": 593.1, "r_x2": 480.6, "r_y2": 584.3, "r_x3": 134.8, "r_y3": 584.3, "coord_origin": "TOPLEFT" }, "text": "structure annotation using (overlapping) bounding boxes for training, and pro-", "orig": "structure annotation using (overlapping) bounding boxes for training, and pro-", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 42, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 134.8, "r_y0": 605.1, "r_x1": 480.6, "r_y1": 605.1, "r_x2": 480.6, "r_y2": 596.3, "r_x3": 134.8, "r_y3": 596.3, "coord_origin": "TOPLEFT" }, "text": "duce bounding-box predictions to define table cells, rows, and columns on a table", "orig": "duce bounding-box predictions to define table cells, rows, and columns on a table", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 43, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 134.8, "r_y0": 617.0, "r_x1": 480.6, "r_y1": 617.0, "r_x2": 480.6, "r_y2": 608.2, "r_x3": 134.8, "r_y3": 608.2, "coord_origin": "TOPLEFT" }, "text": "image. Graph Neural Network (GNN) based methods [3,6,17,18], as the name", "orig": "image. Graph Neural Network (GNN) based methods [3,6,17,18], as the name", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 44, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 134.8, "r_y0": 629.0, "r_x1": 480.6, "r_y1": 629.0, "r_x2": 480.6, "r_y2": 620.2, "r_x3": 134.8, "r_y3": 620.2, "coord_origin": "TOPLEFT" }, "text": "suggests, represent tables as graph structures. The graph nodes represent the", "orig": "suggests, represent tables as graph structures. The graph nodes represent the", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 45, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 134.8, "r_y0": 640.9, "r_x1": 480.6, "r_y1": 640.9, "r_x2": 480.6, "r_y2": 632.1, "r_x3": 134.8, "r_y3": 632.1, "coord_origin": "TOPLEFT" }, "text": "content of each table cell, an embedding vector from the table image, or geomet-", "orig": "content of each table cell, an embedding vector from the table image, or geomet-", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 46, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 134.8, "r_y0": 652.9, "r_x1": 480.6, "r_y1": 652.9, "r_x2": 480.6, "r_y2": 644.1, "r_x3": 134.8, "r_y3": 644.1, "coord_origin": "TOPLEFT" }, "text": "ric coordinates of the table cell. The edges of the graph define the relationship", "orig": "ric coordinates of the table cell. The edges of the graph define the relationship", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 47, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 134.8, "r_y0": 664.9, "r_x1": 480.6, "r_y1": 664.9, "r_x2": 480.6, "r_y2": 656.1, "r_x3": 134.8, "r_y3": 656.1, "coord_origin": "TOPLEFT" }, "text": "between the nodes, e.g. if they belong to the same column, row, or table cell.", "orig": "between the nodes, e.g. if they belong to the same column, row, or table cell.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, "text": "Approaches to formalize the logical structure and layout of tables in electronic documents date back more than two decades [16]. In the recent past, a wide variety of computer vision methods have been explored to tackle the problem of table structure recognition, i.e. the correct identification of columns, rows and spanning cells in a given table. Broadly speaking, the current deeplearning based approaches fall into three categories: object detection (OD) methods, Graph-Neural-Network (GNN) methods and Image-to-Markup-Sequence (Im2Seq) methods. Object-detection based methods [11,12,13,14,21] rely on tablestructure annotation using (overlapping) bounding boxes for training, and produce bounding-box predictions to define table cells, rows, and columns on a table image. Graph Neural Network (GNN) based methods [3,6,17,18], as the name suggests, represent tables as graph structures. The graph nodes represent the content of each table cell, an embedding vector from the table image, or geometric coordinates of the table cell. The edges of the graph define the relationship between the nodes, e.g. if they belong to the same column, row, or table cell." } ], "headers": [ { "label": "page_header", "id": 5, "page_no": 2, "cluster": { "id": 5, "label": "page_header", "bbox": { "l": 194.5, "t": 93.8, "r": 447.5, "b": 101.8, "coord_origin": "TOPLEFT" }, "confidence": 0.93, "cells": [ { "index": 0, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 194.5, "r_y0": 101.8, "r_x1": 447.5, "r_y1": 101.8, "r_x2": 447.5, "r_y2": 93.8, "r_x3": 194.5, "r_y3": 93.8, "coord_origin": "TOPLEFT" }, "text": "Optimized Table Tokenization for Table Structure Recognition", "orig": "Optimized Table Tokenization for Table Structure Recognition", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, "text": "Optimized Table Tokenization for Table Structure Recognition" }, { "label": "page_header", "id": 6, "page_no": 2, "cluster": { "id": 6, "label": "page_header", "bbox": { "l": 476.0, "t": 93.8, "r": 480.6, "b": 101.8, "coord_origin": "TOPLEFT" }, "confidence": 0.88, "cells": [ { "index": 1, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 476.0, "r_y0": 101.8, "r_x1": 480.6, "r_y1": 101.8, "r_x2": 480.6, "r_y2": 93.8, "r_x3": 476.0, "r_y3": 93.8, "coord_origin": "TOPLEFT" }, "text": "3", "orig": "3", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, "text": "3" } ] } }, { "page_no": 3, "size": { "width": 612.0, "height": 792.0 }, "parsed_page": { "dimension": { "angle": 0.0, "rect": { "r_x0": 0.0, "r_y0": 0.0, "r_x1": 612.0, "r_y1": 0.0, "r_x2": 612.0, "r_y2": 792.0, "r_x3": 0.0, "r_y3": 792.0, "coord_origin": "BOTTOMLEFT" }, "boundary_type": "crop_box", "art_bbox": { "l": 0.0, "t": 792.0, "r": 612.0, "b": 0.0, "coord_origin": "BOTTOMLEFT" }, "bleed_bbox": { "l": 0.0, "t": 792.0, "r": 612.0, "b": 0.0, "coord_origin": "BOTTOMLEFT" }, "crop_bbox": { "l": 0.0, "t": 792.0, "r": 612.0, "b": 0.0, "coord_origin": "BOTTOMLEFT" }, "media_bbox": { "l": 0.0, "t": 792.0, "r": 612.0, "b": 0.0, "coord_origin": "BOTTOMLEFT" }, "trim_bbox": { "l": 0.0, "t": 792.0, "r": 612.0, "b": 0.0, "coord_origin": "BOTTOMLEFT" } }, "bitmap_resources": [], "char_cells": [], "word_cells": [], "textline_cells": [ { "index": 0, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 134.8, "r_y0": 101.8, "r_x1": 139.4, "r_y1": 101.8, "r_x2": 139.4, "r_y2": 93.8, "r_x3": 134.8, "r_y3": 93.8, "coord_origin": "TOPLEFT" }, "text": "4", "orig": "4", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 1, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 167.8, "r_y0": 101.8, "r_x1": 178.1, "r_y1": 101.8, "r_x2": 178.1, "r_y2": 93.8, "r_x3": 167.8, "r_y3": 93.8, "coord_origin": "TOPLEFT" }, "text": "M.", "orig": "M.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 2, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 182.4, "r_y0": 101.8, "r_x1": 231.7, "r_y1": 101.8, "r_x2": 231.7, "r_y2": 93.8, "r_x3": 182.4, "r_y3": 93.8, "coord_origin": "TOPLEFT" }, "text": "Lysak, et al.", "orig": "Lysak, et al.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 3, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 134.8, "r_y0": 127.7, "r_x1": 480.6, "r_y1": 127.7, "r_x2": 480.6, "r_y2": 118.9, "r_x3": 134.8, "r_y3": 118.9, "coord_origin": "TOPLEFT" }, "text": "Other work [20] aims at predicting a grid for each table and deciding which cells", "orig": "Other work [20] aims at predicting a grid for each table and deciding which cells", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 4, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 134.8, "r_y0": 139.7, "r_x1": 480.6, "r_y1": 139.7, "r_x2": 480.6, "r_y2": 130.9, "r_x3": 134.8, "r_y3": 130.9, "coord_origin": "TOPLEFT" }, "text": "must be merged using an attention network. Im2Seq methods cast the problem", "orig": "must be merged using an attention network. Im2Seq methods cast the problem", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 5, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 134.8, "r_y0": 151.6, "r_x1": 480.6, "r_y1": 151.6, "r_x2": 480.6, "r_y2": 142.8, "r_x3": 134.8, "r_y3": 142.8, "coord_origin": "TOPLEFT" }, "text": "as a sequence generation task [4,5,9,22], and therefore need an internal table-", "orig": "as a sequence generation task [4,5,9,22], and therefore need an internal table-", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 6, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 134.8, "r_y0": 163.6, "r_x1": 480.6, "r_y1": 163.6, "r_x2": 480.6, "r_y2": 154.8, "r_x3": 134.8, "r_y3": 154.8, "coord_origin": "TOPLEFT" }, "text": "structure representation language, which is often implemented with standard", "orig": "structure representation language, which is often implemented with standard", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 7, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 134.8, "r_y0": 175.6, "r_x1": 480.6, "r_y1": 175.6, "r_x2": 480.6, "r_y2": 166.8, "r_x3": 134.8, "r_y3": 166.8, "coord_origin": "TOPLEFT" }, "text": "markup languages (e.g. HTML, LaTeX, Markdown). In theory, Im2Seq methods", "orig": "markup languages (e.g. HTML, LaTeX, Markdown). In theory, Im2Seq methods", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 8, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 134.8, "r_y0": 187.5, "r_x1": 480.6, "r_y1": 187.5, "r_x2": 480.6, "r_y2": 178.7, "r_x3": 134.8, "r_y3": 178.7, "coord_origin": "TOPLEFT" }, "text": "have a natural advantage over the OD and GNN methods by virtue of directly", "orig": "have a natural advantage over the OD and GNN methods by virtue of directly", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 9, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 134.8, "r_y0": 199.5, "r_x1": 480.6, "r_y1": 199.5, "r_x2": 480.6, "r_y2": 190.7, "r_x3": 134.8, "r_y3": 190.7, "coord_origin": "TOPLEFT" }, "text": "predicting the table-structure. As such, no post-processing or rules are needed", "orig": "predicting the table-structure. As such, no post-processing or rules are needed", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 10, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 134.8, "r_y0": 211.4, "r_x1": 480.6, "r_y1": 211.4, "r_x2": 480.6, "r_y2": 202.6, "r_x3": 134.8, "r_y3": 202.6, "coord_origin": "TOPLEFT" }, "text": "in order to obtain the table-structure, which is necessary with OD and GNN", "orig": "in order to obtain the table-structure, which is necessary with OD and GNN", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 11, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 134.8, "r_y0": 223.4, "r_x1": 480.6, "r_y1": 223.4, "r_x2": 480.6, "r_y2": 214.6, "r_x3": 134.8, "r_y3": 214.6, "coord_origin": "TOPLEFT" }, "text": "approaches. In practice, this is not entirely true, because a predicted sequence", "orig": "approaches. In practice, this is not entirely true, because a predicted sequence", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 12, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 134.8, "r_y0": 235.3, "r_x1": 480.6, "r_y1": 235.3, "r_x2": 480.6, "r_y2": 226.5, "r_x3": 134.8, "r_y3": 226.5, "coord_origin": "TOPLEFT" }, "text": "of table-structure markup does not necessarily have to be syntactically correct.", "orig": "of table-structure markup does not necessarily have to be syntactically correct.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 13, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 134.8, "r_y0": 247.3, "r_x1": 480.6, "r_y1": 247.3, "r_x2": 480.6, "r_y2": 238.5, "r_x3": 134.8, "r_y3": 238.5, "coord_origin": "TOPLEFT" }, "text": "Hence, depending on the quality of the predicted sequence, some post-processing", "orig": "Hence, depending on the quality of the predicted sequence, some post-processing", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 14, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 134.8, "r_y0": 259.2, "r_x1": 480.6, "r_y1": 259.2, "r_x2": 480.6, "r_y2": 250.4, "r_x3": 134.8, "r_y3": 250.4, "coord_origin": "TOPLEFT" }, "text": "needs to be performed to ensure a syntactically valid (let alone correct) sequence.", "orig": "needs to be performed to ensure a syntactically valid (let alone correct) sequence.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 15, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 149.7, "r_y0": 271.5, "r_x1": 480.6, "r_y1": 271.5, "r_x2": 480.6, "r_y2": 262.7, "r_x3": 149.7, "r_y3": 262.7, "coord_origin": "TOPLEFT" }, "text": "Within the Im2Seq method, we find several popular models, namely the", "orig": "Within the Im2Seq method, we find several popular models, namely the", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 16, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 134.8, "r_y0": 283.4, "r_x1": 480.6, "r_y1": 283.4, "r_x2": 480.6, "r_y2": 274.6, "r_x3": 134.8, "r_y3": 274.6, "coord_origin": "TOPLEFT" }, "text": "encoder-dual-decoder model (EDD) [22], TableFormer [9], Tabsplitter[2] and Ye", "orig": "encoder-dual-decoder model (EDD) [22], TableFormer [9], Tabsplitter[2] and Ye", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 17, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 134.8, "r_y0": 295.4, "r_x1": 480.6, "r_y1": 295.4, "r_x2": 480.6, "r_y2": 286.6, "r_x3": 134.8, "r_y3": 286.6, "coord_origin": "TOPLEFT" }, "text": "et. al. [19]. EDD uses two consecutive long short-term memory (LSTM) decoders", "orig": "et. al. [19]. EDD uses two consecutive long short-term memory (LSTM) decoders", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 18, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 134.8, "r_y0": 307.3, "r_x1": 342.0, "r_y1": 307.3, "r_x2": 342.0, "r_y2": 298.5, "r_x3": 134.8, "r_y3": 298.5, "coord_origin": "TOPLEFT" }, "text": "to predict a table in HTML representation. The", "orig": "to predict a table in HTML representation. The", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 19, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 345.1, "r_y0": 307.3, "r_x1": 393.0, "r_y1": 307.3, "r_x2": 393.0, "r_y2": 298.5, "r_x3": 345.1, "r_y3": 298.5, "coord_origin": "TOPLEFT" }, "text": "tag decoder", "orig": "tag decoder", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 20, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 397.2, "r_y0": 307.3, "r_x1": 480.6, "r_y1": 307.3, "r_x2": 480.6, "r_y2": 298.5, "r_x3": 397.2, "r_y3": 298.5, "coord_origin": "TOPLEFT" }, "text": "predicts a sequence", "orig": "predicts a sequence", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 21, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 134.8, "r_y0": 319.3, "r_x1": 333.3, "r_y1": 319.3, "r_x2": 333.3, "r_y2": 310.5, "r_x3": 134.8, "r_y3": 310.5, "coord_origin": "TOPLEFT" }, "text": "of HTML tags. For each decoded table cell (", "orig": "of HTML tags. For each decoded table cell (", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 22, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 333.3, "r_y0": 319.3, "r_x1": 357.0, "r_y1": 319.3, "r_x2": 357.0, "r_y2": 310.5, "r_x3": 333.3, "r_y3": 310.5, "coord_origin": "TOPLEFT" }, "text": "", "orig": "", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 23, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 357.1, "r_y0": 319.3, "r_x1": 480.6, "r_y1": 319.3, "r_x2": 480.6, "r_y2": 310.5, "r_x3": 357.1, "r_y3": 310.5, "coord_origin": "TOPLEFT" }, "text": "), the attention is passed to", "orig": "), the attention is passed to", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 24, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 134.8, "r_y0": 331.2, "r_x1": 148.6, "r_y1": 331.2, "r_x2": 148.6, "r_y2": 322.4, "r_x3": 134.8, "r_y3": 322.4, "coord_origin": "TOPLEFT" }, "text": "the", "orig": "the", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 25, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 152.3, "r_y0": 331.2, "r_x1": 202.1, "r_y1": 331.2, "r_x2": 202.1, "r_y2": 322.4, "r_x3": 152.3, "r_y3": 322.4, "coord_origin": "TOPLEFT" }, "text": "cell decoder", "orig": "cell decoder", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 26, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 206.9, "r_y0": 331.2, "r_x1": 480.6, "r_y1": 331.2, "r_x2": 480.6, "r_y2": 322.4, "r_x3": 206.9, "r_y3": 322.4, "coord_origin": "TOPLEFT" }, "text": "to predict the content with an embedded OCR approach. The", "orig": "to predict the content with an embedded OCR approach. The", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 27, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 134.8, "r_y0": 343.2, "r_x1": 480.6, "r_y1": 343.2, "r_x2": 480.6, "r_y2": 334.4, "r_x3": 134.8, "r_y3": 334.4, "coord_origin": "TOPLEFT" }, "text": "latter makes it susceptible to transcription errors in the cell content of the table.", "orig": "latter makes it susceptible to transcription errors in the cell content of the table.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 28, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 134.8, "r_y0": 355.1, "r_x1": 480.6, "r_y1": 355.1, "r_x2": 480.6, "r_y2": 346.3, "r_x3": 134.8, "r_y3": 346.3, "coord_origin": "TOPLEFT" }, "text": "TableFormer address this reliance on OCR and uses two transformer decoders for", "orig": "TableFormer address this reliance on OCR and uses two transformer decoders for", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 29, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 134.8, "r_y0": 367.1, "r_x1": 480.6, "r_y1": 367.1, "r_x2": 480.6, "r_y2": 358.3, "r_x3": 134.8, "r_y3": 358.3, "coord_origin": "TOPLEFT" }, "text": "HTML structure and cell bounding box prediction in an end-to-end architecture.", "orig": "HTML structure and cell bounding box prediction in an end-to-end architecture.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 30, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 134.8, "r_y0": 379.0, "r_x1": 480.6, "r_y1": 379.0, "r_x2": 480.6, "r_y2": 370.3, "r_x3": 134.8, "r_y3": 370.3, "coord_origin": "TOPLEFT" }, "text": "The predicted cell bounding box is then used to extract text tokens from an", "orig": "The predicted cell bounding box is then used to extract text tokens from an", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 31, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 134.8, "r_y0": 391.0, "r_x1": 480.6, "r_y1": 391.0, "r_x2": 480.6, "r_y2": 382.2, "r_x3": 134.8, "r_y3": 382.2, "coord_origin": "TOPLEFT" }, "text": "originating (digital) PDF page, circumventing any need for OCR. TabSplitter", "orig": "originating (digital) PDF page, circumventing any need for OCR. TabSplitter", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 32, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 134.8, "r_y0": 403.0, "r_x1": 144.8, "r_y1": 403.0, "r_x2": 144.8, "r_y2": 394.2, "r_x3": 134.8, "r_y3": 394.2, "coord_origin": "TOPLEFT" }, "text": "[2]", "orig": "[2]", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 33, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 149.5, "r_y0": 403.0, "r_x1": 480.6, "r_y1": 403.0, "r_x2": 480.6, "r_y2": 394.2, "r_x3": 149.5, "r_y3": 394.2, "coord_origin": "TOPLEFT" }, "text": "proposes a compact double-matrix representation of table rows and columns", "orig": "proposes a compact double-matrix representation of table rows and columns", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 34, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 134.8, "r_y0": 414.9, "r_x1": 480.6, "r_y1": 414.9, "r_x2": 480.6, "r_y2": 406.1, "r_x3": 134.8, "r_y3": 406.1, "coord_origin": "TOPLEFT" }, "text": "to do error detection and error correction of HTML structure sequences based", "orig": "to do error detection and error correction of HTML structure sequences based", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 35, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 134.8, "r_y0": 426.9, "r_x1": 480.6, "r_y1": 426.9, "r_x2": 480.6, "r_y2": 418.1, "r_x3": 134.8, "r_y3": 418.1, "coord_origin": "TOPLEFT" }, "text": "on predictions from [19]. This compact double-matrix representation can not be", "orig": "on predictions from [19]. This compact double-matrix representation can not be", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 36, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 134.8, "r_y0": 438.8, "r_x1": 480.6, "r_y1": 438.8, "r_x2": 480.6, "r_y2": 430.0, "r_x3": 134.8, "r_y3": 430.0, "coord_origin": "TOPLEFT" }, "text": "used directly by the Img2seq model training, so the model uses HTML as an", "orig": "used directly by the Img2seq model training, so the model uses HTML as an", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 37, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 134.8, "r_y0": 450.8, "r_x1": 480.6, "r_y1": 450.8, "r_x2": 480.6, "r_y2": 442.0, "r_x3": 134.8, "r_y3": 442.0, "coord_origin": "TOPLEFT" }, "text": "intermediate form. Chi et. al. [4] introduce a data set and a baseline method", "orig": "intermediate form. Chi et. al. [4] introduce a data set and a baseline method", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 38, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 134.8, "r_y0": 462.7, "r_x1": 384.6, "r_y1": 462.7, "r_x2": 384.6, "r_y2": 453.9, "r_x3": 134.8, "r_y3": 453.9, "coord_origin": "TOPLEFT" }, "text": "using bidirectional LSTMs to predict LaTeX code. Kayal", "orig": "using bidirectional LSTMs to predict LaTeX code. Kayal", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 39, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 391.6, "r_y0": 462.7, "r_x1": 401.7, "r_y1": 462.7, "r_x2": 401.7, "r_y2": 453.9, "r_x3": 391.6, "r_y3": 453.9, "coord_origin": "TOPLEFT" }, "text": "[5]", "orig": "[5]", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 40, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 406.6, "r_y0": 462.7, "r_x1": 480.6, "r_y1": 462.7, "r_x2": 480.6, "r_y2": 453.9, "r_x3": 406.6, "r_y3": 453.9, "coord_origin": "TOPLEFT" }, "text": "introduces Gated", "orig": "introduces Gated", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 41, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 134.8, "r_y0": 474.7, "r_x1": 480.6, "r_y1": 474.7, "r_x2": 480.6, "r_y2": 465.9, "r_x3": 134.8, "r_y3": 465.9, "coord_origin": "TOPLEFT" }, "text": "ResNet transformers to predict LaTeX code, and a separate OCR module to", "orig": "ResNet transformers to predict LaTeX code, and a separate OCR module to", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 42, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 134.8, "r_y0": 486.6, "r_x1": 203.7, "r_y1": 486.6, "r_x2": 203.7, "r_y2": 477.8, "r_x3": 134.8, "r_y3": 477.8, "coord_origin": "TOPLEFT" }, "text": "extract content.", "orig": "extract content.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 43, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 149.7, "r_y0": 498.9, "r_x1": 480.6, "r_y1": 498.9, "r_x2": 480.6, "r_y2": 490.1, "r_x3": 149.7, "r_y3": 490.1, "coord_origin": "TOPLEFT" }, "text": "Im2Seq approaches have shown to be well-suited for the TSR task and allow a", "orig": "Im2Seq approaches have shown to be well-suited for the TSR task and allow a", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 44, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 134.8, "r_y0": 510.8, "r_x1": 480.6, "r_y1": 510.8, "r_x2": 480.6, "r_y2": 502.0, "r_x3": 134.8, "r_y3": 502.0, "coord_origin": "TOPLEFT" }, "text": "full end-to-end network design that can output the final table structure without", "orig": "full end-to-end network design that can output the final table structure without", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 45, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 134.8, "r_y0": 522.8, "r_x1": 480.6, "r_y1": 522.8, "r_x2": 480.6, "r_y2": 514.0, "r_x3": 134.8, "r_y3": 514.0, "coord_origin": "TOPLEFT" }, "text": "pre- or post-processing logic. Furthermore, Im2Seq models have demonstrated", "orig": "pre- or post-processing logic. Furthermore, Im2Seq models have demonstrated", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 46, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 134.8, "r_y0": 534.7, "r_x1": 480.6, "r_y1": 534.7, "r_x2": 480.6, "r_y2": 525.9, "r_x3": 134.8, "r_y3": 525.9, "coord_origin": "TOPLEFT" }, "text": "to deliver state-of-the-art prediction accuracy [9]. This motivated the authors", "orig": "to deliver state-of-the-art prediction accuracy [9]. This motivated the authors", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 47, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 134.8, "r_y0": 546.7, "r_x1": 480.6, "r_y1": 546.7, "r_x2": 480.6, "r_y2": 537.9, "r_x3": 134.8, "r_y3": 537.9, "coord_origin": "TOPLEFT" }, "text": "to investigate if the performance (both in accuracy and inference time) can", "orig": "to investigate if the performance (both in accuracy and inference time) can", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 48, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 134.8, "r_y0": 558.6, "r_x1": 480.6, "r_y1": 558.6, "r_x2": 480.6, "r_y2": 549.8, "r_x3": 134.8, "r_y3": 549.8, "coord_origin": "TOPLEFT" }, "text": "be further improved by optimising the table structure representation language.", "orig": "be further improved by optimising the table structure representation language.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 49, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 134.8, "r_y0": 570.6, "r_x1": 480.6, "r_y1": 570.6, "r_x2": 480.6, "r_y2": 561.8, "r_x3": 134.8, "r_y3": 561.8, "coord_origin": "TOPLEFT" }, "text": "We believe this is a necessary step before further improving neural network", "orig": "We believe this is a necessary step before further improving neural network", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 50, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 134.8, "r_y0": 582.5, "r_x1": 249.3, "r_y1": 582.5, "r_x2": 249.3, "r_y2": 573.8, "r_x3": 134.8, "r_y3": 573.8, "coord_origin": "TOPLEFT" }, "text": "architectures for this task.", "orig": "architectures for this task.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 51, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 134.8, "r_y0": 616.1, "r_x1": 141.5, "r_y1": 616.1, "r_x2": 141.5, "r_y2": 605.5, "r_x3": 134.8, "r_y3": 605.5, "coord_origin": "TOPLEFT" }, "text": "3", "orig": "3", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 52, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 154.9, "r_y0": 616.1, "r_x1": 269.6, "r_y1": 616.1, "r_x2": 269.6, "r_y2": 605.5, "r_x3": 154.9, "r_y3": 605.5, "coord_origin": "TOPLEFT" }, "text": "Problem Statement", "orig": "Problem Statement", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 53, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 134.8, "r_y0": 640.9, "r_x1": 480.6, "r_y1": 640.9, "r_x2": 480.6, "r_y2": 632.1, "r_x3": 134.8, "r_y3": 632.1, "coord_origin": "TOPLEFT" }, "text": "All known Im2Seq based models for TSR fundamentally work in similar ways.", "orig": "All known Im2Seq based models for TSR fundamentally work in similar ways.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 54, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 134.8, "r_y0": 652.9, "r_x1": 480.6, "r_y1": 652.9, "r_x2": 480.6, "r_y2": 644.1, "r_x3": 134.8, "r_y3": 644.1, "coord_origin": "TOPLEFT" }, "text": "Given an image of a table, the Im2Seq model predicts the structure of the table", "orig": "Given an image of a table, the Im2Seq model predicts the structure of the table", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 55, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 134.8, "r_y0": 664.9, "r_x1": 480.6, "r_y1": 664.9, "r_x2": 480.6, "r_y2": 656.1, "r_x3": 134.8, "r_y3": 656.1, "coord_origin": "TOPLEFT" }, "text": "by generating a sequence of tokens. These tokens originate from a finite vocab-", "orig": "by generating a sequence of tokens. These tokens originate from a finite vocab-", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "has_chars": false, "has_words": false, "has_lines": true, "image": null, "lines": [] }, "predictions": { "layout": { "clusters": [ { "id": 6, "label": "page_header", "bbox": { "l": 134.8, "t": 93.8, "r": 139.4, "b": 101.8, "coord_origin": "TOPLEFT" }, "confidence": 0.79, "cells": [ { "index": 0, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 134.8, "r_y0": 101.8, "r_x1": 139.4, "r_y1": 101.8, "r_x2": 139.4, "r_y2": 93.8, "r_x3": 134.8, "r_y3": 93.8, "coord_origin": "TOPLEFT" }, "text": "4", "orig": "4", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 5, "label": "page_header", "bbox": { "l": 167.8, "t": 93.8, "r": 231.7, "b": 101.8, "coord_origin": "TOPLEFT" }, "confidence": 0.9, "cells": [ { "index": 1, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 167.8, "r_y0": 101.8, "r_x1": 178.1, "r_y1": 101.8, "r_x2": 178.1, "r_y2": 93.8, "r_x3": 167.8, "r_y3": 93.8, "coord_origin": "TOPLEFT" }, "text": "M.", "orig": "M.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 2, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 182.4, "r_y0": 101.8, "r_x1": 231.7, "r_y1": 101.8, "r_x2": 231.7, "r_y2": 93.8, "r_x3": 182.4, "r_y3": 93.8, "coord_origin": "TOPLEFT" }, "text": "Lysak, et al.", "orig": "Lysak, et al.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 2, "label": "text", "bbox": { "l": 134.8, "t": 118.9, "r": 480.6, "b": 259.2, "coord_origin": "TOPLEFT" }, "confidence": 0.95, "cells": [ { "index": 3, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 134.8, "r_y0": 127.7, "r_x1": 480.6, "r_y1": 127.7, "r_x2": 480.6, "r_y2": 118.9, "r_x3": 134.8, "r_y3": 118.9, "coord_origin": "TOPLEFT" }, "text": "Other work [20] aims at predicting a grid for each table and deciding which cells", "orig": "Other work [20] aims at predicting a grid for each table and deciding which cells", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 4, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 134.8, "r_y0": 139.7, "r_x1": 480.6, "r_y1": 139.7, "r_x2": 480.6, "r_y2": 130.9, "r_x3": 134.8, "r_y3": 130.9, "coord_origin": "TOPLEFT" }, "text": "must be merged using an attention network. Im2Seq methods cast the problem", "orig": "must be merged using an attention network. Im2Seq methods cast the problem", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 5, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 134.8, "r_y0": 151.6, "r_x1": 480.6, "r_y1": 151.6, "r_x2": 480.6, "r_y2": 142.8, "r_x3": 134.8, "r_y3": 142.8, "coord_origin": "TOPLEFT" }, "text": "as a sequence generation task [4,5,9,22], and therefore need an internal table-", "orig": "as a sequence generation task [4,5,9,22], and therefore need an internal table-", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 6, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 134.8, "r_y0": 163.6, "r_x1": 480.6, "r_y1": 163.6, "r_x2": 480.6, "r_y2": 154.8, "r_x3": 134.8, "r_y3": 154.8, "coord_origin": "TOPLEFT" }, "text": "structure representation language, which is often implemented with standard", "orig": "structure representation language, which is often implemented with standard", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 7, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 134.8, "r_y0": 175.6, "r_x1": 480.6, "r_y1": 175.6, "r_x2": 480.6, "r_y2": 166.8, "r_x3": 134.8, "r_y3": 166.8, "coord_origin": "TOPLEFT" }, "text": "markup languages (e.g. HTML, LaTeX, Markdown). In theory, Im2Seq methods", "orig": "markup languages (e.g. HTML, LaTeX, Markdown). In theory, Im2Seq methods", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 8, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 134.8, "r_y0": 187.5, "r_x1": 480.6, "r_y1": 187.5, "r_x2": 480.6, "r_y2": 178.7, "r_x3": 134.8, "r_y3": 178.7, "coord_origin": "TOPLEFT" }, "text": "have a natural advantage over the OD and GNN methods by virtue of directly", "orig": "have a natural advantage over the OD and GNN methods by virtue of directly", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 9, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 134.8, "r_y0": 199.5, "r_x1": 480.6, "r_y1": 199.5, "r_x2": 480.6, "r_y2": 190.7, "r_x3": 134.8, "r_y3": 190.7, "coord_origin": "TOPLEFT" }, "text": "predicting the table-structure. As such, no post-processing or rules are needed", "orig": "predicting the table-structure. As such, no post-processing or rules are needed", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 10, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 134.8, "r_y0": 211.4, "r_x1": 480.6, "r_y1": 211.4, "r_x2": 480.6, "r_y2": 202.6, "r_x3": 134.8, "r_y3": 202.6, "coord_origin": "TOPLEFT" }, "text": "in order to obtain the table-structure, which is necessary with OD and GNN", "orig": "in order to obtain the table-structure, which is necessary with OD and GNN", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 11, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 134.8, "r_y0": 223.4, "r_x1": 480.6, "r_y1": 223.4, "r_x2": 480.6, "r_y2": 214.6, "r_x3": 134.8, "r_y3": 214.6, "coord_origin": "TOPLEFT" }, "text": "approaches. In practice, this is not entirely true, because a predicted sequence", "orig": "approaches. In practice, this is not entirely true, because a predicted sequence", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 12, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 134.8, "r_y0": 235.3, "r_x1": 480.6, "r_y1": 235.3, "r_x2": 480.6, "r_y2": 226.5, "r_x3": 134.8, "r_y3": 226.5, "coord_origin": "TOPLEFT" }, "text": "of table-structure markup does not necessarily have to be syntactically correct.", "orig": "of table-structure markup does not necessarily have to be syntactically correct.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 13, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 134.8, "r_y0": 247.3, "r_x1": 480.6, "r_y1": 247.3, "r_x2": 480.6, "r_y2": 238.5, "r_x3": 134.8, "r_y3": 238.5, "coord_origin": "TOPLEFT" }, "text": "Hence, depending on the quality of the predicted sequence, some post-processing", "orig": "Hence, depending on the quality of the predicted sequence, some post-processing", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 14, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 134.8, "r_y0": 259.2, "r_x1": 480.6, "r_y1": 259.2, "r_x2": 480.6, "r_y2": 250.4, "r_x3": 134.8, "r_y3": 250.4, "coord_origin": "TOPLEFT" }, "text": "needs to be performed to ensure a syntactically valid (let alone correct) sequence.", "orig": "needs to be performed to ensure a syntactically valid (let alone correct) sequence.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 4, "label": "text", "bbox": { "l": 134.8, "t": 262.7, "r": 480.6, "b": 486.6, "coord_origin": "TOPLEFT" }, "confidence": 0.93, "cells": [ { "index": 15, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 149.7, "r_y0": 271.5, "r_x1": 480.6, "r_y1": 271.5, "r_x2": 480.6, "r_y2": 262.7, "r_x3": 149.7, "r_y3": 262.7, "coord_origin": "TOPLEFT" }, "text": "Within the Im2Seq method, we find several popular models, namely the", "orig": "Within the Im2Seq method, we find several popular models, namely the", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 16, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 134.8, "r_y0": 283.4, "r_x1": 480.6, "r_y1": 283.4, "r_x2": 480.6, "r_y2": 274.6, "r_x3": 134.8, "r_y3": 274.6, "coord_origin": "TOPLEFT" }, "text": "encoder-dual-decoder model (EDD) [22], TableFormer [9], Tabsplitter[2] and Ye", "orig": "encoder-dual-decoder model (EDD) [22], TableFormer [9], Tabsplitter[2] and Ye", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 17, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 134.8, "r_y0": 295.4, "r_x1": 480.6, "r_y1": 295.4, "r_x2": 480.6, "r_y2": 286.6, "r_x3": 134.8, "r_y3": 286.6, "coord_origin": "TOPLEFT" }, "text": "et. al. [19]. EDD uses two consecutive long short-term memory (LSTM) decoders", "orig": "et. al. [19]. EDD uses two consecutive long short-term memory (LSTM) decoders", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 18, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 134.8, "r_y0": 307.3, "r_x1": 342.0, "r_y1": 307.3, "r_x2": 342.0, "r_y2": 298.5, "r_x3": 134.8, "r_y3": 298.5, "coord_origin": "TOPLEFT" }, "text": "to predict a table in HTML representation. The", "orig": "to predict a table in HTML representation. The", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 19, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 345.1, "r_y0": 307.3, "r_x1": 393.0, "r_y1": 307.3, "r_x2": 393.0, "r_y2": 298.5, "r_x3": 345.1, "r_y3": 298.5, "coord_origin": "TOPLEFT" }, "text": "tag decoder", "orig": "tag decoder", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 20, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 397.2, "r_y0": 307.3, "r_x1": 480.6, "r_y1": 307.3, "r_x2": 480.6, "r_y2": 298.5, "r_x3": 397.2, "r_y3": 298.5, "coord_origin": "TOPLEFT" }, "text": "predicts a sequence", "orig": "predicts a sequence", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 21, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 134.8, "r_y0": 319.3, "r_x1": 333.3, "r_y1": 319.3, "r_x2": 333.3, "r_y2": 310.5, "r_x3": 134.8, "r_y3": 310.5, "coord_origin": "TOPLEFT" }, "text": "of HTML tags. For each decoded table cell (", "orig": "of HTML tags. For each decoded table cell (", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 22, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 333.3, "r_y0": 319.3, "r_x1": 357.0, "r_y1": 319.3, "r_x2": 357.0, "r_y2": 310.5, "r_x3": 333.3, "r_y3": 310.5, "coord_origin": "TOPLEFT" }, "text": "", "orig": "", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 23, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 357.1, "r_y0": 319.3, "r_x1": 480.6, "r_y1": 319.3, "r_x2": 480.6, "r_y2": 310.5, "r_x3": 357.1, "r_y3": 310.5, "coord_origin": "TOPLEFT" }, "text": "), the attention is passed to", "orig": "), the attention is passed to", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 24, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 134.8, "r_y0": 331.2, "r_x1": 148.6, "r_y1": 331.2, "r_x2": 148.6, "r_y2": 322.4, "r_x3": 134.8, "r_y3": 322.4, "coord_origin": "TOPLEFT" }, "text": "the", "orig": "the", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 25, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 152.3, "r_y0": 331.2, "r_x1": 202.1, "r_y1": 331.2, "r_x2": 202.1, "r_y2": 322.4, "r_x3": 152.3, "r_y3": 322.4, "coord_origin": "TOPLEFT" }, "text": "cell decoder", "orig": "cell decoder", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 26, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 206.9, "r_y0": 331.2, "r_x1": 480.6, "r_y1": 331.2, "r_x2": 480.6, "r_y2": 322.4, "r_x3": 206.9, "r_y3": 322.4, "coord_origin": "TOPLEFT" }, "text": "to predict the content with an embedded OCR approach. The", "orig": "to predict the content with an embedded OCR approach. The", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 27, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 134.8, "r_y0": 343.2, "r_x1": 480.6, "r_y1": 343.2, "r_x2": 480.6, "r_y2": 334.4, "r_x3": 134.8, "r_y3": 334.4, "coord_origin": "TOPLEFT" }, "text": "latter makes it susceptible to transcription errors in the cell content of the table.", "orig": "latter makes it susceptible to transcription errors in the cell content of the table.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 28, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 134.8, "r_y0": 355.1, "r_x1": 480.6, "r_y1": 355.1, "r_x2": 480.6, "r_y2": 346.3, "r_x3": 134.8, "r_y3": 346.3, "coord_origin": "TOPLEFT" }, "text": "TableFormer address this reliance on OCR and uses two transformer decoders for", "orig": "TableFormer address this reliance on OCR and uses two transformer decoders for", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 29, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 134.8, "r_y0": 367.1, "r_x1": 480.6, "r_y1": 367.1, "r_x2": 480.6, "r_y2": 358.3, "r_x3": 134.8, "r_y3": 358.3, "coord_origin": "TOPLEFT" }, "text": "HTML structure and cell bounding box prediction in an end-to-end architecture.", "orig": "HTML structure and cell bounding box prediction in an end-to-end architecture.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 30, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 134.8, "r_y0": 379.0, "r_x1": 480.6, "r_y1": 379.0, "r_x2": 480.6, "r_y2": 370.3, "r_x3": 134.8, "r_y3": 370.3, "coord_origin": "TOPLEFT" }, "text": "The predicted cell bounding box is then used to extract text tokens from an", "orig": "The predicted cell bounding box is then used to extract text tokens from an", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 31, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 134.8, "r_y0": 391.0, "r_x1": 480.6, "r_y1": 391.0, "r_x2": 480.6, "r_y2": 382.2, "r_x3": 134.8, "r_y3": 382.2, "coord_origin": "TOPLEFT" }, "text": "originating (digital) PDF page, circumventing any need for OCR. TabSplitter", "orig": "originating (digital) PDF page, circumventing any need for OCR. TabSplitter", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 32, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 134.8, "r_y0": 403.0, "r_x1": 144.8, "r_y1": 403.0, "r_x2": 144.8, "r_y2": 394.2, "r_x3": 134.8, "r_y3": 394.2, "coord_origin": "TOPLEFT" }, "text": "[2]", "orig": "[2]", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 33, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 149.5, "r_y0": 403.0, "r_x1": 480.6, "r_y1": 403.0, "r_x2": 480.6, "r_y2": 394.2, "r_x3": 149.5, "r_y3": 394.2, "coord_origin": "TOPLEFT" }, "text": "proposes a compact double-matrix representation of table rows and columns", "orig": "proposes a compact double-matrix representation of table rows and columns", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 34, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 134.8, "r_y0": 414.9, "r_x1": 480.6, "r_y1": 414.9, "r_x2": 480.6, "r_y2": 406.1, "r_x3": 134.8, "r_y3": 406.1, "coord_origin": "TOPLEFT" }, "text": "to do error detection and error correction of HTML structure sequences based", "orig": "to do error detection and error correction of HTML structure sequences based", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 35, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 134.8, "r_y0": 426.9, "r_x1": 480.6, "r_y1": 426.9, "r_x2": 480.6, "r_y2": 418.1, "r_x3": 134.8, "r_y3": 418.1, "coord_origin": "TOPLEFT" }, "text": "on predictions from [19]. This compact double-matrix representation can not be", "orig": "on predictions from [19]. This compact double-matrix representation can not be", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 36, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 134.8, "r_y0": 438.8, "r_x1": 480.6, "r_y1": 438.8, "r_x2": 480.6, "r_y2": 430.0, "r_x3": 134.8, "r_y3": 430.0, "coord_origin": "TOPLEFT" }, "text": "used directly by the Img2seq model training, so the model uses HTML as an", "orig": "used directly by the Img2seq model training, so the model uses HTML as an", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 37, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 134.8, "r_y0": 450.8, "r_x1": 480.6, "r_y1": 450.8, "r_x2": 480.6, "r_y2": 442.0, "r_x3": 134.8, "r_y3": 442.0, "coord_origin": "TOPLEFT" }, "text": "intermediate form. Chi et. al. [4] introduce a data set and a baseline method", "orig": "intermediate form. Chi et. al. [4] introduce a data set and a baseline method", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 38, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 134.8, "r_y0": 462.7, "r_x1": 384.6, "r_y1": 462.7, "r_x2": 384.6, "r_y2": 453.9, "r_x3": 134.8, "r_y3": 453.9, "coord_origin": "TOPLEFT" }, "text": "using bidirectional LSTMs to predict LaTeX code. Kayal", "orig": "using bidirectional LSTMs to predict LaTeX code. Kayal", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 39, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 391.6, "r_y0": 462.7, "r_x1": 401.7, "r_y1": 462.7, "r_x2": 401.7, "r_y2": 453.9, "r_x3": 391.6, "r_y3": 453.9, "coord_origin": "TOPLEFT" }, "text": "[5]", "orig": "[5]", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 40, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 406.6, "r_y0": 462.7, "r_x1": 480.6, "r_y1": 462.7, "r_x2": 480.6, "r_y2": 453.9, "r_x3": 406.6, "r_y3": 453.9, "coord_origin": "TOPLEFT" }, "text": "introduces Gated", "orig": "introduces Gated", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 41, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 134.8, "r_y0": 474.7, "r_x1": 480.6, "r_y1": 474.7, "r_x2": 480.6, "r_y2": 465.9, "r_x3": 134.8, "r_y3": 465.9, "coord_origin": "TOPLEFT" }, "text": "ResNet transformers to predict LaTeX code, and a separate OCR module to", "orig": "ResNet transformers to predict LaTeX code, and a separate OCR module to", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 42, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 134.8, "r_y0": 486.6, "r_x1": 203.7, "r_y1": 486.6, "r_x2": 203.7, "r_y2": 477.8, "r_x3": 134.8, "r_y3": 477.8, "coord_origin": "TOPLEFT" }, "text": "extract content.", "orig": "extract content.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 0, "label": "text", "bbox": { "l": 134.8, "t": 490.1, "r": 480.6, "b": 582.5, "coord_origin": "TOPLEFT" }, "confidence": 0.99, "cells": [ { "index": 43, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 149.7, "r_y0": 498.9, "r_x1": 480.6, "r_y1": 498.9, "r_x2": 480.6, "r_y2": 490.1, "r_x3": 149.7, "r_y3": 490.1, "coord_origin": "TOPLEFT" }, "text": "Im2Seq approaches have shown to be well-suited for the TSR task and allow a", "orig": "Im2Seq approaches have shown to be well-suited for the TSR task and allow a", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 44, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 134.8, "r_y0": 510.8, "r_x1": 480.6, "r_y1": 510.8, "r_x2": 480.6, "r_y2": 502.0, "r_x3": 134.8, "r_y3": 502.0, "coord_origin": "TOPLEFT" }, "text": "full end-to-end network design that can output the final table structure without", "orig": "full end-to-end network design that can output the final table structure without", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 45, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 134.8, "r_y0": 522.8, "r_x1": 480.6, "r_y1": 522.8, "r_x2": 480.6, "r_y2": 514.0, "r_x3": 134.8, "r_y3": 514.0, "coord_origin": "TOPLEFT" }, "text": "pre- or post-processing logic. Furthermore, Im2Seq models have demonstrated", "orig": "pre- or post-processing logic. Furthermore, Im2Seq models have demonstrated", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 46, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 134.8, "r_y0": 534.7, "r_x1": 480.6, "r_y1": 534.7, "r_x2": 480.6, "r_y2": 525.9, "r_x3": 134.8, "r_y3": 525.9, "coord_origin": "TOPLEFT" }, "text": "to deliver state-of-the-art prediction accuracy [9]. This motivated the authors", "orig": "to deliver state-of-the-art prediction accuracy [9]. This motivated the authors", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 47, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 134.8, "r_y0": 546.7, "r_x1": 480.6, "r_y1": 546.7, "r_x2": 480.6, "r_y2": 537.9, "r_x3": 134.8, "r_y3": 537.9, "coord_origin": "TOPLEFT" }, "text": "to investigate if the performance (both in accuracy and inference time) can", "orig": "to investigate if the performance (both in accuracy and inference time) can", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 48, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 134.8, "r_y0": 558.6, "r_x1": 480.6, "r_y1": 558.6, "r_x2": 480.6, "r_y2": 549.8, "r_x3": 134.8, "r_y3": 549.8, "coord_origin": "TOPLEFT" }, "text": "be further improved by optimising the table structure representation language.", "orig": "be further improved by optimising the table structure representation language.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 49, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 134.8, "r_y0": 570.6, "r_x1": 480.6, "r_y1": 570.6, "r_x2": 480.6, "r_y2": 561.8, "r_x3": 134.8, "r_y3": 561.8, "coord_origin": "TOPLEFT" }, "text": "We believe this is a necessary step before further improving neural network", "orig": "We believe this is a necessary step before further improving neural network", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 50, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 134.8, "r_y0": 582.5, "r_x1": 249.3, "r_y1": 582.5, "r_x2": 249.3, "r_y2": 573.8, "r_x3": 134.8, "r_y3": 573.8, "coord_origin": "TOPLEFT" }, "text": "architectures for this task.", "orig": "architectures for this task.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 3, "label": "section_header", "bbox": { "l": 134.8, "t": 605.5, "r": 269.6, "b": 616.1, "coord_origin": "TOPLEFT" }, "confidence": 0.94, "cells": [ { "index": 51, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 134.8, "r_y0": 616.1, "r_x1": 141.5, "r_y1": 616.1, "r_x2": 141.5, "r_y2": 605.5, "r_x3": 134.8, "r_y3": 605.5, "coord_origin": "TOPLEFT" }, "text": "3", "orig": "3", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 52, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 154.9, "r_y0": 616.1, "r_x1": 269.6, "r_y1": 616.1, "r_x2": 269.6, "r_y2": 605.5, "r_x3": 154.9, "r_y3": 605.5, "coord_origin": "TOPLEFT" }, "text": "Problem Statement", "orig": "Problem Statement", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 1, "label": "text", "bbox": { "l": 134.8, "t": 632.1, "r": 480.6, "b": 664.9, "coord_origin": "TOPLEFT" }, "confidence": 0.97, "cells": [ { "index": 53, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 134.8, "r_y0": 640.9, "r_x1": 480.6, "r_y1": 640.9, "r_x2": 480.6, "r_y2": 632.1, "r_x3": 134.8, "r_y3": 632.1, "coord_origin": "TOPLEFT" }, "text": "All known Im2Seq based models for TSR fundamentally work in similar ways.", "orig": "All known Im2Seq based models for TSR fundamentally work in similar ways.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 54, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 134.8, "r_y0": 652.9, "r_x1": 480.6, "r_y1": 652.9, "r_x2": 480.6, "r_y2": 644.1, "r_x3": 134.8, "r_y3": 644.1, "coord_origin": "TOPLEFT" }, "text": "Given an image of a table, the Im2Seq model predicts the structure of the table", "orig": "Given an image of a table, the Im2Seq model predicts the structure of the table", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 55, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 134.8, "r_y0": 664.9, "r_x1": 480.6, "r_y1": 664.9, "r_x2": 480.6, "r_y2": 656.1, "r_x3": 134.8, "r_y3": 656.1, "coord_origin": "TOPLEFT" }, "text": "by generating a sequence of tokens. These tokens originate from a finite vocab-", "orig": "by generating a sequence of tokens. These tokens originate from a finite vocab-", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] } ] }, "tablestructure": { "table_map": {} }, "figures_classification": null, "equations_prediction": null, "vlm_response": null }, "assembled": { "elements": [ { "label": "page_header", "id": 6, "page_no": 3, "cluster": { "id": 6, "label": "page_header", "bbox": { "l": 134.8, "t": 93.8, "r": 139.4, "b": 101.8, "coord_origin": "TOPLEFT" }, "confidence": 0.79, "cells": [ { "index": 0, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 134.8, "r_y0": 101.8, "r_x1": 139.4, "r_y1": 101.8, "r_x2": 139.4, "r_y2": 93.8, "r_x3": 134.8, "r_y3": 93.8, "coord_origin": "TOPLEFT" }, "text": "4", "orig": "4", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, "text": "4" }, { "label": "page_header", "id": 5, "page_no": 3, "cluster": { "id": 5, "label": "page_header", "bbox": { "l": 167.8, "t": 93.8, "r": 231.7, "b": 101.8, "coord_origin": "TOPLEFT" }, "confidence": 0.9, "cells": [ { "index": 1, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 167.8, "r_y0": 101.8, "r_x1": 178.1, "r_y1": 101.8, "r_x2": 178.1, "r_y2": 93.8, "r_x3": 167.8, "r_y3": 93.8, "coord_origin": "TOPLEFT" }, "text": "M.", "orig": "M.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 2, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 182.4, "r_y0": 101.8, "r_x1": 231.7, "r_y1": 101.8, "r_x2": 231.7, "r_y2": 93.8, "r_x3": 182.4, "r_y3": 93.8, "coord_origin": "TOPLEFT" }, "text": "Lysak, et al.", "orig": "Lysak, et al.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, "text": "M. Lysak, et al." }, { "label": "text", "id": 2, "page_no": 3, "cluster": { "id": 2, "label": "text", "bbox": { "l": 134.8, "t": 118.9, "r": 480.6, "b": 259.2, "coord_origin": "TOPLEFT" }, "confidence": 0.95, "cells": [ { "index": 3, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 134.8, "r_y0": 127.7, "r_x1": 480.6, "r_y1": 127.7, "r_x2": 480.6, "r_y2": 118.9, "r_x3": 134.8, "r_y3": 118.9, "coord_origin": "TOPLEFT" }, "text": "Other work [20] aims at predicting a grid for each table and deciding which cells", "orig": "Other work [20] aims at predicting a grid for each table and deciding which cells", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 4, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 134.8, "r_y0": 139.7, "r_x1": 480.6, "r_y1": 139.7, "r_x2": 480.6, "r_y2": 130.9, "r_x3": 134.8, "r_y3": 130.9, "coord_origin": "TOPLEFT" }, "text": "must be merged using an attention network. Im2Seq methods cast the problem", "orig": "must be merged using an attention network. Im2Seq methods cast the problem", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 5, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 134.8, "r_y0": 151.6, "r_x1": 480.6, "r_y1": 151.6, "r_x2": 480.6, "r_y2": 142.8, "r_x3": 134.8, "r_y3": 142.8, "coord_origin": "TOPLEFT" }, "text": "as a sequence generation task [4,5,9,22], and therefore need an internal table-", "orig": "as a sequence generation task [4,5,9,22], and therefore need an internal table-", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 6, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 134.8, "r_y0": 163.6, "r_x1": 480.6, "r_y1": 163.6, "r_x2": 480.6, "r_y2": 154.8, "r_x3": 134.8, "r_y3": 154.8, "coord_origin": "TOPLEFT" }, "text": "structure representation language, which is often implemented with standard", "orig": "structure representation language, which is often implemented with standard", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 7, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 134.8, "r_y0": 175.6, "r_x1": 480.6, "r_y1": 175.6, "r_x2": 480.6, "r_y2": 166.8, "r_x3": 134.8, "r_y3": 166.8, "coord_origin": "TOPLEFT" }, "text": "markup languages (e.g. HTML, LaTeX, Markdown). In theory, Im2Seq methods", "orig": "markup languages (e.g. HTML, LaTeX, Markdown). In theory, Im2Seq methods", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 8, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 134.8, "r_y0": 187.5, "r_x1": 480.6, "r_y1": 187.5, "r_x2": 480.6, "r_y2": 178.7, "r_x3": 134.8, "r_y3": 178.7, "coord_origin": "TOPLEFT" }, "text": "have a natural advantage over the OD and GNN methods by virtue of directly", "orig": "have a natural advantage over the OD and GNN methods by virtue of directly", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 9, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 134.8, "r_y0": 199.5, "r_x1": 480.6, "r_y1": 199.5, "r_x2": 480.6, "r_y2": 190.7, "r_x3": 134.8, "r_y3": 190.7, "coord_origin": "TOPLEFT" }, "text": "predicting the table-structure. As such, no post-processing or rules are needed", "orig": "predicting the table-structure. As such, no post-processing or rules are needed", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 10, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 134.8, "r_y0": 211.4, "r_x1": 480.6, "r_y1": 211.4, "r_x2": 480.6, "r_y2": 202.6, "r_x3": 134.8, "r_y3": 202.6, "coord_origin": "TOPLEFT" }, "text": "in order to obtain the table-structure, which is necessary with OD and GNN", "orig": "in order to obtain the table-structure, which is necessary with OD and GNN", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 11, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 134.8, "r_y0": 223.4, "r_x1": 480.6, "r_y1": 223.4, "r_x2": 480.6, "r_y2": 214.6, "r_x3": 134.8, "r_y3": 214.6, "coord_origin": "TOPLEFT" }, "text": "approaches. In practice, this is not entirely true, because a predicted sequence", "orig": "approaches. In practice, this is not entirely true, because a predicted sequence", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 12, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 134.8, "r_y0": 235.3, "r_x1": 480.6, "r_y1": 235.3, "r_x2": 480.6, "r_y2": 226.5, "r_x3": 134.8, "r_y3": 226.5, "coord_origin": "TOPLEFT" }, "text": "of table-structure markup does not necessarily have to be syntactically correct.", "orig": "of table-structure markup does not necessarily have to be syntactically correct.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 13, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 134.8, "r_y0": 247.3, "r_x1": 480.6, "r_y1": 247.3, "r_x2": 480.6, "r_y2": 238.5, "r_x3": 134.8, "r_y3": 238.5, "coord_origin": "TOPLEFT" }, "text": "Hence, depending on the quality of the predicted sequence, some post-processing", "orig": "Hence, depending on the quality of the predicted sequence, some post-processing", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 14, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 134.8, "r_y0": 259.2, "r_x1": 480.6, "r_y1": 259.2, "r_x2": 480.6, "r_y2": 250.4, "r_x3": 134.8, "r_y3": 250.4, "coord_origin": "TOPLEFT" }, "text": "needs to be performed to ensure a syntactically valid (let alone correct) sequence.", "orig": "needs to be performed to ensure a syntactically valid (let alone correct) sequence.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, "text": "Other work [20] aims at predicting a grid for each table and deciding which cells must be merged using an attention network. Im2Seq methods cast the problem as a sequence generation task [4,5,9,22], and therefore need an internal tablestructure representation language, which is often implemented with standard markup languages (e.g. HTML, LaTeX, Markdown). In theory, Im2Seq methods have a natural advantage over the OD and GNN methods by virtue of directly predicting the table-structure. As such, no post-processing or rules are needed in order to obtain the table-structure, which is necessary with OD and GNN approaches. In practice, this is not entirely true, because a predicted sequence of table-structure markup does not necessarily have to be syntactically correct. Hence, depending on the quality of the predicted sequence, some post-processing needs to be performed to ensure a syntactically valid (let alone correct) sequence." }, { "label": "text", "id": 4, "page_no": 3, "cluster": { "id": 4, "label": "text", "bbox": { "l": 134.8, "t": 262.7, "r": 480.6, "b": 486.6, "coord_origin": "TOPLEFT" }, "confidence": 0.93, "cells": [ { "index": 15, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 149.7, "r_y0": 271.5, "r_x1": 480.6, "r_y1": 271.5, "r_x2": 480.6, "r_y2": 262.7, "r_x3": 149.7, "r_y3": 262.7, "coord_origin": "TOPLEFT" }, "text": "Within the Im2Seq method, we find several popular models, namely the", "orig": "Within the Im2Seq method, we find several popular models, namely the", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 16, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 134.8, "r_y0": 283.4, "r_x1": 480.6, "r_y1": 283.4, "r_x2": 480.6, "r_y2": 274.6, "r_x3": 134.8, "r_y3": 274.6, "coord_origin": "TOPLEFT" }, "text": "encoder-dual-decoder model (EDD) [22], TableFormer [9], Tabsplitter[2] and Ye", "orig": "encoder-dual-decoder model (EDD) [22], TableFormer [9], Tabsplitter[2] and Ye", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 17, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 134.8, "r_y0": 295.4, "r_x1": 480.6, "r_y1": 295.4, "r_x2": 480.6, "r_y2": 286.6, "r_x3": 134.8, "r_y3": 286.6, "coord_origin": "TOPLEFT" }, "text": "et. al. [19]. EDD uses two consecutive long short-term memory (LSTM) decoders", "orig": "et. al. [19]. EDD uses two consecutive long short-term memory (LSTM) decoders", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 18, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 134.8, "r_y0": 307.3, "r_x1": 342.0, "r_y1": 307.3, "r_x2": 342.0, "r_y2": 298.5, "r_x3": 134.8, "r_y3": 298.5, "coord_origin": "TOPLEFT" }, "text": "to predict a table in HTML representation. The", "orig": "to predict a table in HTML representation. The", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 19, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 345.1, "r_y0": 307.3, "r_x1": 393.0, "r_y1": 307.3, "r_x2": 393.0, "r_y2": 298.5, "r_x3": 345.1, "r_y3": 298.5, "coord_origin": "TOPLEFT" }, "text": "tag decoder", "orig": "tag decoder", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 20, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 397.2, "r_y0": 307.3, "r_x1": 480.6, "r_y1": 307.3, "r_x2": 480.6, "r_y2": 298.5, "r_x3": 397.2, "r_y3": 298.5, "coord_origin": "TOPLEFT" }, "text": "predicts a sequence", "orig": "predicts a sequence", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 21, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 134.8, "r_y0": 319.3, "r_x1": 333.3, "r_y1": 319.3, "r_x2": 333.3, "r_y2": 310.5, "r_x3": 134.8, "r_y3": 310.5, "coord_origin": "TOPLEFT" }, "text": "of HTML tags. For each decoded table cell (", "orig": "of HTML tags. For each decoded table cell (", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 22, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 333.3, "r_y0": 319.3, "r_x1": 357.0, "r_y1": 319.3, "r_x2": 357.0, "r_y2": 310.5, "r_x3": 333.3, "r_y3": 310.5, "coord_origin": "TOPLEFT" }, "text": "", "orig": "", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 23, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 357.1, "r_y0": 319.3, "r_x1": 480.6, "r_y1": 319.3, "r_x2": 480.6, "r_y2": 310.5, "r_x3": 357.1, "r_y3": 310.5, "coord_origin": "TOPLEFT" }, "text": "), the attention is passed to", "orig": "), the attention is passed to", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 24, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 134.8, "r_y0": 331.2, "r_x1": 148.6, "r_y1": 331.2, "r_x2": 148.6, "r_y2": 322.4, "r_x3": 134.8, "r_y3": 322.4, "coord_origin": "TOPLEFT" }, "text": "the", "orig": "the", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 25, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 152.3, "r_y0": 331.2, "r_x1": 202.1, "r_y1": 331.2, "r_x2": 202.1, "r_y2": 322.4, "r_x3": 152.3, "r_y3": 322.4, "coord_origin": "TOPLEFT" }, "text": "cell decoder", "orig": "cell decoder", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 26, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 206.9, "r_y0": 331.2, "r_x1": 480.6, "r_y1": 331.2, "r_x2": 480.6, "r_y2": 322.4, "r_x3": 206.9, "r_y3": 322.4, "coord_origin": "TOPLEFT" }, "text": "to predict the content with an embedded OCR approach. The", "orig": "to predict the content with an embedded OCR approach. The", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 27, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 134.8, "r_y0": 343.2, "r_x1": 480.6, "r_y1": 343.2, "r_x2": 480.6, "r_y2": 334.4, "r_x3": 134.8, "r_y3": 334.4, "coord_origin": "TOPLEFT" }, "text": "latter makes it susceptible to transcription errors in the cell content of the table.", "orig": "latter makes it susceptible to transcription errors in the cell content of the table.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 28, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 134.8, "r_y0": 355.1, "r_x1": 480.6, "r_y1": 355.1, "r_x2": 480.6, "r_y2": 346.3, "r_x3": 134.8, "r_y3": 346.3, "coord_origin": "TOPLEFT" }, "text": "TableFormer address this reliance on OCR and uses two transformer decoders for", "orig": "TableFormer address this reliance on OCR and uses two transformer decoders for", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 29, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 134.8, "r_y0": 367.1, "r_x1": 480.6, "r_y1": 367.1, "r_x2": 480.6, "r_y2": 358.3, "r_x3": 134.8, "r_y3": 358.3, "coord_origin": "TOPLEFT" }, "text": "HTML structure and cell bounding box prediction in an end-to-end architecture.", "orig": "HTML structure and cell bounding box prediction in an end-to-end architecture.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 30, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 134.8, "r_y0": 379.0, "r_x1": 480.6, "r_y1": 379.0, "r_x2": 480.6, "r_y2": 370.3, "r_x3": 134.8, "r_y3": 370.3, "coord_origin": "TOPLEFT" }, "text": "The predicted cell bounding box is then used to extract text tokens from an", "orig": "The predicted cell bounding box is then used to extract text tokens from an", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 31, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 134.8, "r_y0": 391.0, "r_x1": 480.6, "r_y1": 391.0, "r_x2": 480.6, "r_y2": 382.2, "r_x3": 134.8, "r_y3": 382.2, "coord_origin": "TOPLEFT" }, "text": "originating (digital) PDF page, circumventing any need for OCR. TabSplitter", "orig": "originating (digital) PDF page, circumventing any need for OCR. TabSplitter", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 32, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 134.8, "r_y0": 403.0, "r_x1": 144.8, "r_y1": 403.0, "r_x2": 144.8, "r_y2": 394.2, "r_x3": 134.8, "r_y3": 394.2, "coord_origin": "TOPLEFT" }, "text": "[2]", "orig": "[2]", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 33, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 149.5, "r_y0": 403.0, "r_x1": 480.6, "r_y1": 403.0, "r_x2": 480.6, "r_y2": 394.2, "r_x3": 149.5, "r_y3": 394.2, "coord_origin": "TOPLEFT" }, "text": "proposes a compact double-matrix representation of table rows and columns", "orig": "proposes a compact double-matrix representation of table rows and columns", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 34, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 134.8, "r_y0": 414.9, "r_x1": 480.6, "r_y1": 414.9, "r_x2": 480.6, "r_y2": 406.1, "r_x3": 134.8, "r_y3": 406.1, "coord_origin": "TOPLEFT" }, "text": "to do error detection and error correction of HTML structure sequences based", "orig": "to do error detection and error correction of HTML structure sequences based", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 35, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 134.8, "r_y0": 426.9, "r_x1": 480.6, "r_y1": 426.9, "r_x2": 480.6, "r_y2": 418.1, "r_x3": 134.8, "r_y3": 418.1, "coord_origin": "TOPLEFT" }, "text": "on predictions from [19]. This compact double-matrix representation can not be", "orig": "on predictions from [19]. This compact double-matrix representation can not be", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 36, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 134.8, "r_y0": 438.8, "r_x1": 480.6, "r_y1": 438.8, "r_x2": 480.6, "r_y2": 430.0, "r_x3": 134.8, "r_y3": 430.0, "coord_origin": "TOPLEFT" }, "text": "used directly by the Img2seq model training, so the model uses HTML as an", "orig": "used directly by the Img2seq model training, so the model uses HTML as an", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 37, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 134.8, "r_y0": 450.8, "r_x1": 480.6, "r_y1": 450.8, "r_x2": 480.6, "r_y2": 442.0, "r_x3": 134.8, "r_y3": 442.0, "coord_origin": "TOPLEFT" }, "text": "intermediate form. Chi et. al. [4] introduce a data set and a baseline method", "orig": "intermediate form. Chi et. al. [4] introduce a data set and a baseline method", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 38, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 134.8, "r_y0": 462.7, "r_x1": 384.6, "r_y1": 462.7, "r_x2": 384.6, "r_y2": 453.9, "r_x3": 134.8, "r_y3": 453.9, "coord_origin": "TOPLEFT" }, "text": "using bidirectional LSTMs to predict LaTeX code. Kayal", "orig": "using bidirectional LSTMs to predict LaTeX code. Kayal", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 39, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 391.6, "r_y0": 462.7, "r_x1": 401.7, "r_y1": 462.7, "r_x2": 401.7, "r_y2": 453.9, "r_x3": 391.6, "r_y3": 453.9, "coord_origin": "TOPLEFT" }, "text": "[5]", "orig": "[5]", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 40, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 406.6, "r_y0": 462.7, "r_x1": 480.6, "r_y1": 462.7, "r_x2": 480.6, "r_y2": 453.9, "r_x3": 406.6, "r_y3": 453.9, "coord_origin": "TOPLEFT" }, "text": "introduces Gated", "orig": "introduces Gated", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 41, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 134.8, "r_y0": 474.7, "r_x1": 480.6, "r_y1": 474.7, "r_x2": 480.6, "r_y2": 465.9, "r_x3": 134.8, "r_y3": 465.9, "coord_origin": "TOPLEFT" }, "text": "ResNet transformers to predict LaTeX code, and a separate OCR module to", "orig": "ResNet transformers to predict LaTeX code, and a separate OCR module to", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 42, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 134.8, "r_y0": 486.6, "r_x1": 203.7, "r_y1": 486.6, "r_x2": 203.7, "r_y2": 477.8, "r_x3": 134.8, "r_y3": 477.8, "coord_origin": "TOPLEFT" }, "text": "extract content.", "orig": "extract content.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, "text": "Within the Im2Seq method, we find several popular models, namely the encoder-dual-decoder model (EDD) [22], TableFormer [9], Tabsplitter[2] and Ye et. al. [19]. EDD uses two consecutive long short-term memory (LSTM) decoders to predict a table in HTML representation. The tag decoder predicts a sequence of HTML tags. For each decoded table cell ( ), the attention is passed to the cell decoder to predict the content with an embedded OCR approach. The latter makes it susceptible to transcription errors in the cell content of the table. TableFormer address this reliance on OCR and uses two transformer decoders for HTML structure and cell bounding box prediction in an end-to-end architecture. The predicted cell bounding box is then used to extract text tokens from an originating (digital) PDF page, circumventing any need for OCR. TabSplitter [2] proposes a compact double-matrix representation of table rows and columns to do error detection and error correction of HTML structure sequences based on predictions from [19]. This compact double-matrix representation can not be used directly by the Img2seq model training, so the model uses HTML as an intermediate form. Chi et. al. [4] introduce a data set and a baseline method using bidirectional LSTMs to predict LaTeX code. Kayal [5] introduces Gated ResNet transformers to predict LaTeX code, and a separate OCR module to extract content." }, { "label": "text", "id": 0, "page_no": 3, "cluster": { "id": 0, "label": "text", "bbox": { "l": 134.8, "t": 490.1, "r": 480.6, "b": 582.5, "coord_origin": "TOPLEFT" }, "confidence": 0.99, "cells": [ { "index": 43, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 149.7, "r_y0": 498.9, "r_x1": 480.6, "r_y1": 498.9, "r_x2": 480.6, "r_y2": 490.1, "r_x3": 149.7, "r_y3": 490.1, "coord_origin": "TOPLEFT" }, "text": "Im2Seq approaches have shown to be well-suited for the TSR task and allow a", "orig": "Im2Seq approaches have shown to be well-suited for the TSR task and allow a", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 44, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 134.8, "r_y0": 510.8, "r_x1": 480.6, "r_y1": 510.8, "r_x2": 480.6, "r_y2": 502.0, "r_x3": 134.8, "r_y3": 502.0, "coord_origin": "TOPLEFT" }, "text": "full end-to-end network design that can output the final table structure without", "orig": "full end-to-end network design that can output the final table structure without", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 45, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 134.8, "r_y0": 522.8, "r_x1": 480.6, "r_y1": 522.8, "r_x2": 480.6, "r_y2": 514.0, "r_x3": 134.8, "r_y3": 514.0, "coord_origin": "TOPLEFT" }, "text": "pre- or post-processing logic. Furthermore, Im2Seq models have demonstrated", "orig": "pre- or post-processing logic. Furthermore, Im2Seq models have demonstrated", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 46, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 134.8, "r_y0": 534.7, "r_x1": 480.6, "r_y1": 534.7, "r_x2": 480.6, "r_y2": 525.9, "r_x3": 134.8, "r_y3": 525.9, "coord_origin": "TOPLEFT" }, "text": "to deliver state-of-the-art prediction accuracy [9]. This motivated the authors", "orig": "to deliver state-of-the-art prediction accuracy [9]. This motivated the authors", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 47, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 134.8, "r_y0": 546.7, "r_x1": 480.6, "r_y1": 546.7, "r_x2": 480.6, "r_y2": 537.9, "r_x3": 134.8, "r_y3": 537.9, "coord_origin": "TOPLEFT" }, "text": "to investigate if the performance (both in accuracy and inference time) can", "orig": "to investigate if the performance (both in accuracy and inference time) can", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 48, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 134.8, "r_y0": 558.6, "r_x1": 480.6, "r_y1": 558.6, "r_x2": 480.6, "r_y2": 549.8, "r_x3": 134.8, "r_y3": 549.8, "coord_origin": "TOPLEFT" }, "text": "be further improved by optimising the table structure representation language.", "orig": "be further improved by optimising the table structure representation language.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 49, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 134.8, "r_y0": 570.6, "r_x1": 480.6, "r_y1": 570.6, "r_x2": 480.6, "r_y2": 561.8, "r_x3": 134.8, "r_y3": 561.8, "coord_origin": "TOPLEFT" }, "text": "We believe this is a necessary step before further improving neural network", "orig": "We believe this is a necessary step before further improving neural network", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 50, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 134.8, "r_y0": 582.5, "r_x1": 249.3, "r_y1": 582.5, "r_x2": 249.3, "r_y2": 573.8, "r_x3": 134.8, "r_y3": 573.8, "coord_origin": "TOPLEFT" }, "text": "architectures for this task.", "orig": "architectures for this task.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, "text": "Im2Seq approaches have shown to be well-suited for the TSR task and allow a full end-to-end network design that can output the final table structure without pre- or post-processing logic. Furthermore, Im2Seq models have demonstrated to deliver state-of-the-art prediction accuracy [9]. This motivated the authors to investigate if the performance (both in accuracy and inference time) can be further improved by optimising the table structure representation language. We believe this is a necessary step before further improving neural network architectures for this task." }, { "label": "section_header", "id": 3, "page_no": 3, "cluster": { "id": 3, "label": "section_header", "bbox": { "l": 134.8, "t": 605.5, "r": 269.6, "b": 616.1, "coord_origin": "TOPLEFT" }, "confidence": 0.94, "cells": [ { "index": 51, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 134.8, "r_y0": 616.1, "r_x1": 141.5, "r_y1": 616.1, "r_x2": 141.5, "r_y2": 605.5, "r_x3": 134.8, "r_y3": 605.5, "coord_origin": "TOPLEFT" }, "text": "3", "orig": "3", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 52, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 154.9, "r_y0": 616.1, "r_x1": 269.6, "r_y1": 616.1, "r_x2": 269.6, "r_y2": 605.5, "r_x3": 154.9, "r_y3": 605.5, "coord_origin": "TOPLEFT" }, "text": "Problem Statement", "orig": "Problem Statement", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, "text": "3 Problem Statement" }, { "label": "text", "id": 1, "page_no": 3, "cluster": { "id": 1, "label": "text", "bbox": { "l": 134.8, "t": 632.1, "r": 480.6, "b": 664.9, "coord_origin": "TOPLEFT" }, "confidence": 0.97, "cells": [ { "index": 53, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 134.8, "r_y0": 640.9, "r_x1": 480.6, "r_y1": 640.9, "r_x2": 480.6, "r_y2": 632.1, "r_x3": 134.8, "r_y3": 632.1, "coord_origin": "TOPLEFT" }, "text": "All known Im2Seq based models for TSR fundamentally work in similar ways.", "orig": "All known Im2Seq based models for TSR fundamentally work in similar ways.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 54, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 134.8, "r_y0": 652.9, "r_x1": 480.6, "r_y1": 652.9, "r_x2": 480.6, "r_y2": 644.1, "r_x3": 134.8, "r_y3": 644.1, "coord_origin": "TOPLEFT" }, "text": "Given an image of a table, the Im2Seq model predicts the structure of the table", "orig": "Given an image of a table, the Im2Seq model predicts the structure of the table", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 55, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 134.8, "r_y0": 664.9, "r_x1": 480.6, "r_y1": 664.9, "r_x2": 480.6, "r_y2": 656.1, "r_x3": 134.8, "r_y3": 656.1, "coord_origin": "TOPLEFT" }, "text": "by generating a sequence of tokens. These tokens originate from a finite vocab-", "orig": "by generating a sequence of tokens. These tokens originate from a finite vocab-", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, "text": "All known Im2Seq based models for TSR fundamentally work in similar ways. Given an image of a table, the Im2Seq model predicts the structure of the table by generating a sequence of tokens. These tokens originate from a finite vocab-" } ], "body": [ { "label": "text", "id": 2, "page_no": 3, "cluster": { "id": 2, "label": "text", "bbox": { "l": 134.8, "t": 118.9, "r": 480.6, "b": 259.2, "coord_origin": "TOPLEFT" }, "confidence": 0.95, "cells": [ { "index": 3, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 134.8, "r_y0": 127.7, "r_x1": 480.6, "r_y1": 127.7, "r_x2": 480.6, "r_y2": 118.9, "r_x3": 134.8, "r_y3": 118.9, "coord_origin": "TOPLEFT" }, "text": "Other work [20] aims at predicting a grid for each table and deciding which cells", "orig": "Other work [20] aims at predicting a grid for each table and deciding which cells", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 4, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 134.8, "r_y0": 139.7, "r_x1": 480.6, "r_y1": 139.7, "r_x2": 480.6, "r_y2": 130.9, "r_x3": 134.8, "r_y3": 130.9, "coord_origin": "TOPLEFT" }, "text": "must be merged using an attention network. Im2Seq methods cast the problem", "orig": "must be merged using an attention network. Im2Seq methods cast the problem", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 5, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 134.8, "r_y0": 151.6, "r_x1": 480.6, "r_y1": 151.6, "r_x2": 480.6, "r_y2": 142.8, "r_x3": 134.8, "r_y3": 142.8, "coord_origin": "TOPLEFT" }, "text": "as a sequence generation task [4,5,9,22], and therefore need an internal table-", "orig": "as a sequence generation task [4,5,9,22], and therefore need an internal table-", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 6, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 134.8, "r_y0": 163.6, "r_x1": 480.6, "r_y1": 163.6, "r_x2": 480.6, "r_y2": 154.8, "r_x3": 134.8, "r_y3": 154.8, "coord_origin": "TOPLEFT" }, "text": "structure representation language, which is often implemented with standard", "orig": "structure representation language, which is often implemented with standard", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 7, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 134.8, "r_y0": 175.6, "r_x1": 480.6, "r_y1": 175.6, "r_x2": 480.6, "r_y2": 166.8, "r_x3": 134.8, "r_y3": 166.8, "coord_origin": "TOPLEFT" }, "text": "markup languages (e.g. HTML, LaTeX, Markdown). In theory, Im2Seq methods", "orig": "markup languages (e.g. HTML, LaTeX, Markdown). In theory, Im2Seq methods", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 8, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 134.8, "r_y0": 187.5, "r_x1": 480.6, "r_y1": 187.5, "r_x2": 480.6, "r_y2": 178.7, "r_x3": 134.8, "r_y3": 178.7, "coord_origin": "TOPLEFT" }, "text": "have a natural advantage over the OD and GNN methods by virtue of directly", "orig": "have a natural advantage over the OD and GNN methods by virtue of directly", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 9, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 134.8, "r_y0": 199.5, "r_x1": 480.6, "r_y1": 199.5, "r_x2": 480.6, "r_y2": 190.7, "r_x3": 134.8, "r_y3": 190.7, "coord_origin": "TOPLEFT" }, "text": "predicting the table-structure. As such, no post-processing or rules are needed", "orig": "predicting the table-structure. As such, no post-processing or rules are needed", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 10, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 134.8, "r_y0": 211.4, "r_x1": 480.6, "r_y1": 211.4, "r_x2": 480.6, "r_y2": 202.6, "r_x3": 134.8, "r_y3": 202.6, "coord_origin": "TOPLEFT" }, "text": "in order to obtain the table-structure, which is necessary with OD and GNN", "orig": "in order to obtain the table-structure, which is necessary with OD and GNN", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 11, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 134.8, "r_y0": 223.4, "r_x1": 480.6, "r_y1": 223.4, "r_x2": 480.6, "r_y2": 214.6, "r_x3": 134.8, "r_y3": 214.6, "coord_origin": "TOPLEFT" }, "text": "approaches. In practice, this is not entirely true, because a predicted sequence", "orig": "approaches. In practice, this is not entirely true, because a predicted sequence", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 12, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 134.8, "r_y0": 235.3, "r_x1": 480.6, "r_y1": 235.3, "r_x2": 480.6, "r_y2": 226.5, "r_x3": 134.8, "r_y3": 226.5, "coord_origin": "TOPLEFT" }, "text": "of table-structure markup does not necessarily have to be syntactically correct.", "orig": "of table-structure markup does not necessarily have to be syntactically correct.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 13, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 134.8, "r_y0": 247.3, "r_x1": 480.6, "r_y1": 247.3, "r_x2": 480.6, "r_y2": 238.5, "r_x3": 134.8, "r_y3": 238.5, "coord_origin": "TOPLEFT" }, "text": "Hence, depending on the quality of the predicted sequence, some post-processing", "orig": "Hence, depending on the quality of the predicted sequence, some post-processing", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 14, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 134.8, "r_y0": 259.2, "r_x1": 480.6, "r_y1": 259.2, "r_x2": 480.6, "r_y2": 250.4, "r_x3": 134.8, "r_y3": 250.4, "coord_origin": "TOPLEFT" }, "text": "needs to be performed to ensure a syntactically valid (let alone correct) sequence.", "orig": "needs to be performed to ensure a syntactically valid (let alone correct) sequence.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, "text": "Other work [20] aims at predicting a grid for each table and deciding which cells must be merged using an attention network. Im2Seq methods cast the problem as a sequence generation task [4,5,9,22], and therefore need an internal tablestructure representation language, which is often implemented with standard markup languages (e.g. HTML, LaTeX, Markdown). In theory, Im2Seq methods have a natural advantage over the OD and GNN methods by virtue of directly predicting the table-structure. As such, no post-processing or rules are needed in order to obtain the table-structure, which is necessary with OD and GNN approaches. In practice, this is not entirely true, because a predicted sequence of table-structure markup does not necessarily have to be syntactically correct. Hence, depending on the quality of the predicted sequence, some post-processing needs to be performed to ensure a syntactically valid (let alone correct) sequence." }, { "label": "text", "id": 4, "page_no": 3, "cluster": { "id": 4, "label": "text", "bbox": { "l": 134.8, "t": 262.7, "r": 480.6, "b": 486.6, "coord_origin": "TOPLEFT" }, "confidence": 0.93, "cells": [ { "index": 15, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 149.7, "r_y0": 271.5, "r_x1": 480.6, "r_y1": 271.5, "r_x2": 480.6, "r_y2": 262.7, "r_x3": 149.7, "r_y3": 262.7, "coord_origin": "TOPLEFT" }, "text": "Within the Im2Seq method, we find several popular models, namely the", "orig": "Within the Im2Seq method, we find several popular models, namely the", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 16, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 134.8, "r_y0": 283.4, "r_x1": 480.6, "r_y1": 283.4, "r_x2": 480.6, "r_y2": 274.6, "r_x3": 134.8, "r_y3": 274.6, "coord_origin": "TOPLEFT" }, "text": "encoder-dual-decoder model (EDD) [22], TableFormer [9], Tabsplitter[2] and Ye", "orig": "encoder-dual-decoder model (EDD) [22], TableFormer [9], Tabsplitter[2] and Ye", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 17, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 134.8, "r_y0": 295.4, "r_x1": 480.6, "r_y1": 295.4, "r_x2": 480.6, "r_y2": 286.6, "r_x3": 134.8, "r_y3": 286.6, "coord_origin": "TOPLEFT" }, "text": "et. al. [19]. EDD uses two consecutive long short-term memory (LSTM) decoders", "orig": "et. al. [19]. EDD uses two consecutive long short-term memory (LSTM) decoders", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 18, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 134.8, "r_y0": 307.3, "r_x1": 342.0, "r_y1": 307.3, "r_x2": 342.0, "r_y2": 298.5, "r_x3": 134.8, "r_y3": 298.5, "coord_origin": "TOPLEFT" }, "text": "to predict a table in HTML representation. The", "orig": "to predict a table in HTML representation. The", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 19, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 345.1, "r_y0": 307.3, "r_x1": 393.0, "r_y1": 307.3, "r_x2": 393.0, "r_y2": 298.5, "r_x3": 345.1, "r_y3": 298.5, "coord_origin": "TOPLEFT" }, "text": "tag decoder", "orig": "tag decoder", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 20, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 397.2, "r_y0": 307.3, "r_x1": 480.6, "r_y1": 307.3, "r_x2": 480.6, "r_y2": 298.5, "r_x3": 397.2, "r_y3": 298.5, "coord_origin": "TOPLEFT" }, "text": "predicts a sequence", "orig": "predicts a sequence", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 21, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 134.8, "r_y0": 319.3, "r_x1": 333.3, "r_y1": 319.3, "r_x2": 333.3, "r_y2": 310.5, "r_x3": 134.8, "r_y3": 310.5, "coord_origin": "TOPLEFT" }, "text": "of HTML tags. For each decoded table cell (", "orig": "of HTML tags. For each decoded table cell (", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 22, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 333.3, "r_y0": 319.3, "r_x1": 357.0, "r_y1": 319.3, "r_x2": 357.0, "r_y2": 310.5, "r_x3": 333.3, "r_y3": 310.5, "coord_origin": "TOPLEFT" }, "text": "", "orig": "", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 23, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 357.1, "r_y0": 319.3, "r_x1": 480.6, "r_y1": 319.3, "r_x2": 480.6, "r_y2": 310.5, "r_x3": 357.1, "r_y3": 310.5, "coord_origin": "TOPLEFT" }, "text": "), the attention is passed to", "orig": "), the attention is passed to", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 24, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 134.8, "r_y0": 331.2, "r_x1": 148.6, "r_y1": 331.2, "r_x2": 148.6, "r_y2": 322.4, "r_x3": 134.8, "r_y3": 322.4, "coord_origin": "TOPLEFT" }, "text": "the", "orig": "the", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 25, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 152.3, "r_y0": 331.2, "r_x1": 202.1, "r_y1": 331.2, "r_x2": 202.1, "r_y2": 322.4, "r_x3": 152.3, "r_y3": 322.4, "coord_origin": "TOPLEFT" }, "text": "cell decoder", "orig": "cell decoder", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 26, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 206.9, "r_y0": 331.2, "r_x1": 480.6, "r_y1": 331.2, "r_x2": 480.6, "r_y2": 322.4, "r_x3": 206.9, "r_y3": 322.4, "coord_origin": "TOPLEFT" }, "text": "to predict the content with an embedded OCR approach. The", "orig": "to predict the content with an embedded OCR approach. The", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 27, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 134.8, "r_y0": 343.2, "r_x1": 480.6, "r_y1": 343.2, "r_x2": 480.6, "r_y2": 334.4, "r_x3": 134.8, "r_y3": 334.4, "coord_origin": "TOPLEFT" }, "text": "latter makes it susceptible to transcription errors in the cell content of the table.", "orig": "latter makes it susceptible to transcription errors in the cell content of the table.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 28, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 134.8, "r_y0": 355.1, "r_x1": 480.6, "r_y1": 355.1, "r_x2": 480.6, "r_y2": 346.3, "r_x3": 134.8, "r_y3": 346.3, "coord_origin": "TOPLEFT" }, "text": "TableFormer address this reliance on OCR and uses two transformer decoders for", "orig": "TableFormer address this reliance on OCR and uses two transformer decoders for", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 29, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 134.8, "r_y0": 367.1, "r_x1": 480.6, "r_y1": 367.1, "r_x2": 480.6, "r_y2": 358.3, "r_x3": 134.8, "r_y3": 358.3, "coord_origin": "TOPLEFT" }, "text": "HTML structure and cell bounding box prediction in an end-to-end architecture.", "orig": "HTML structure and cell bounding box prediction in an end-to-end architecture.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 30, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 134.8, "r_y0": 379.0, "r_x1": 480.6, "r_y1": 379.0, "r_x2": 480.6, "r_y2": 370.3, "r_x3": 134.8, "r_y3": 370.3, "coord_origin": "TOPLEFT" }, "text": "The predicted cell bounding box is then used to extract text tokens from an", "orig": "The predicted cell bounding box is then used to extract text tokens from an", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 31, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 134.8, "r_y0": 391.0, "r_x1": 480.6, "r_y1": 391.0, "r_x2": 480.6, "r_y2": 382.2, "r_x3": 134.8, "r_y3": 382.2, "coord_origin": "TOPLEFT" }, "text": "originating (digital) PDF page, circumventing any need for OCR. TabSplitter", "orig": "originating (digital) PDF page, circumventing any need for OCR. TabSplitter", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 32, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 134.8, "r_y0": 403.0, "r_x1": 144.8, "r_y1": 403.0, "r_x2": 144.8, "r_y2": 394.2, "r_x3": 134.8, "r_y3": 394.2, "coord_origin": "TOPLEFT" }, "text": "[2]", "orig": "[2]", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 33, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 149.5, "r_y0": 403.0, "r_x1": 480.6, "r_y1": 403.0, "r_x2": 480.6, "r_y2": 394.2, "r_x3": 149.5, "r_y3": 394.2, "coord_origin": "TOPLEFT" }, "text": "proposes a compact double-matrix representation of table rows and columns", "orig": "proposes a compact double-matrix representation of table rows and columns", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 34, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 134.8, "r_y0": 414.9, "r_x1": 480.6, "r_y1": 414.9, "r_x2": 480.6, "r_y2": 406.1, "r_x3": 134.8, "r_y3": 406.1, "coord_origin": "TOPLEFT" }, "text": "to do error detection and error correction of HTML structure sequences based", "orig": "to do error detection and error correction of HTML structure sequences based", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 35, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 134.8, "r_y0": 426.9, "r_x1": 480.6, "r_y1": 426.9, "r_x2": 480.6, "r_y2": 418.1, "r_x3": 134.8, "r_y3": 418.1, "coord_origin": "TOPLEFT" }, "text": "on predictions from [19]. This compact double-matrix representation can not be", "orig": "on predictions from [19]. This compact double-matrix representation can not be", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 36, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 134.8, "r_y0": 438.8, "r_x1": 480.6, "r_y1": 438.8, "r_x2": 480.6, "r_y2": 430.0, "r_x3": 134.8, "r_y3": 430.0, "coord_origin": "TOPLEFT" }, "text": "used directly by the Img2seq model training, so the model uses HTML as an", "orig": "used directly by the Img2seq model training, so the model uses HTML as an", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 37, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 134.8, "r_y0": 450.8, "r_x1": 480.6, "r_y1": 450.8, "r_x2": 480.6, "r_y2": 442.0, "r_x3": 134.8, "r_y3": 442.0, "coord_origin": "TOPLEFT" }, "text": "intermediate form. Chi et. al. [4] introduce a data set and a baseline method", "orig": "intermediate form. Chi et. al. [4] introduce a data set and a baseline method", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 38, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 134.8, "r_y0": 462.7, "r_x1": 384.6, "r_y1": 462.7, "r_x2": 384.6, "r_y2": 453.9, "r_x3": 134.8, "r_y3": 453.9, "coord_origin": "TOPLEFT" }, "text": "using bidirectional LSTMs to predict LaTeX code. Kayal", "orig": "using bidirectional LSTMs to predict LaTeX code. Kayal", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 39, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 391.6, "r_y0": 462.7, "r_x1": 401.7, "r_y1": 462.7, "r_x2": 401.7, "r_y2": 453.9, "r_x3": 391.6, "r_y3": 453.9, "coord_origin": "TOPLEFT" }, "text": "[5]", "orig": "[5]", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 40, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 406.6, "r_y0": 462.7, "r_x1": 480.6, "r_y1": 462.7, "r_x2": 480.6, "r_y2": 453.9, "r_x3": 406.6, "r_y3": 453.9, "coord_origin": "TOPLEFT" }, "text": "introduces Gated", "orig": "introduces Gated", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 41, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 134.8, "r_y0": 474.7, "r_x1": 480.6, "r_y1": 474.7, "r_x2": 480.6, "r_y2": 465.9, "r_x3": 134.8, "r_y3": 465.9, "coord_origin": "TOPLEFT" }, "text": "ResNet transformers to predict LaTeX code, and a separate OCR module to", "orig": "ResNet transformers to predict LaTeX code, and a separate OCR module to", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 42, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 134.8, "r_y0": 486.6, "r_x1": 203.7, "r_y1": 486.6, "r_x2": 203.7, "r_y2": 477.8, "r_x3": 134.8, "r_y3": 477.8, "coord_origin": "TOPLEFT" }, "text": "extract content.", "orig": "extract content.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, "text": "Within the Im2Seq method, we find several popular models, namely the encoder-dual-decoder model (EDD) [22], TableFormer [9], Tabsplitter[2] and Ye et. al. [19]. EDD uses two consecutive long short-term memory (LSTM) decoders to predict a table in HTML representation. The tag decoder predicts a sequence of HTML tags. For each decoded table cell ( ), the attention is passed to the cell decoder to predict the content with an embedded OCR approach. The latter makes it susceptible to transcription errors in the cell content of the table. TableFormer address this reliance on OCR and uses two transformer decoders for HTML structure and cell bounding box prediction in an end-to-end architecture. The predicted cell bounding box is then used to extract text tokens from an originating (digital) PDF page, circumventing any need for OCR. TabSplitter [2] proposes a compact double-matrix representation of table rows and columns to do error detection and error correction of HTML structure sequences based on predictions from [19]. This compact double-matrix representation can not be used directly by the Img2seq model training, so the model uses HTML as an intermediate form. Chi et. al. [4] introduce a data set and a baseline method using bidirectional LSTMs to predict LaTeX code. Kayal [5] introduces Gated ResNet transformers to predict LaTeX code, and a separate OCR module to extract content." }, { "label": "text", "id": 0, "page_no": 3, "cluster": { "id": 0, "label": "text", "bbox": { "l": 134.8, "t": 490.1, "r": 480.6, "b": 582.5, "coord_origin": "TOPLEFT" }, "confidence": 0.99, "cells": [ { "index": 43, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 149.7, "r_y0": 498.9, "r_x1": 480.6, "r_y1": 498.9, "r_x2": 480.6, "r_y2": 490.1, "r_x3": 149.7, "r_y3": 490.1, "coord_origin": "TOPLEFT" }, "text": "Im2Seq approaches have shown to be well-suited for the TSR task and allow a", "orig": "Im2Seq approaches have shown to be well-suited for the TSR task and allow a", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 44, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 134.8, "r_y0": 510.8, "r_x1": 480.6, "r_y1": 510.8, "r_x2": 480.6, "r_y2": 502.0, "r_x3": 134.8, "r_y3": 502.0, "coord_origin": "TOPLEFT" }, "text": "full end-to-end network design that can output the final table structure without", "orig": "full end-to-end network design that can output the final table structure without", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 45, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 134.8, "r_y0": 522.8, "r_x1": 480.6, "r_y1": 522.8, "r_x2": 480.6, "r_y2": 514.0, "r_x3": 134.8, "r_y3": 514.0, "coord_origin": "TOPLEFT" }, "text": "pre- or post-processing logic. Furthermore, Im2Seq models have demonstrated", "orig": "pre- or post-processing logic. Furthermore, Im2Seq models have demonstrated", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 46, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 134.8, "r_y0": 534.7, "r_x1": 480.6, "r_y1": 534.7, "r_x2": 480.6, "r_y2": 525.9, "r_x3": 134.8, "r_y3": 525.9, "coord_origin": "TOPLEFT" }, "text": "to deliver state-of-the-art prediction accuracy [9]. This motivated the authors", "orig": "to deliver state-of-the-art prediction accuracy [9]. This motivated the authors", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 47, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 134.8, "r_y0": 546.7, "r_x1": 480.6, "r_y1": 546.7, "r_x2": 480.6, "r_y2": 537.9, "r_x3": 134.8, "r_y3": 537.9, "coord_origin": "TOPLEFT" }, "text": "to investigate if the performance (both in accuracy and inference time) can", "orig": "to investigate if the performance (both in accuracy and inference time) can", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 48, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 134.8, "r_y0": 558.6, "r_x1": 480.6, "r_y1": 558.6, "r_x2": 480.6, "r_y2": 549.8, "r_x3": 134.8, "r_y3": 549.8, "coord_origin": "TOPLEFT" }, "text": "be further improved by optimising the table structure representation language.", "orig": "be further improved by optimising the table structure representation language.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 49, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 134.8, "r_y0": 570.6, "r_x1": 480.6, "r_y1": 570.6, "r_x2": 480.6, "r_y2": 561.8, "r_x3": 134.8, "r_y3": 561.8, "coord_origin": "TOPLEFT" }, "text": "We believe this is a necessary step before further improving neural network", "orig": "We believe this is a necessary step before further improving neural network", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 50, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 134.8, "r_y0": 582.5, "r_x1": 249.3, "r_y1": 582.5, "r_x2": 249.3, "r_y2": 573.8, "r_x3": 134.8, "r_y3": 573.8, "coord_origin": "TOPLEFT" }, "text": "architectures for this task.", "orig": "architectures for this task.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, "text": "Im2Seq approaches have shown to be well-suited for the TSR task and allow a full end-to-end network design that can output the final table structure without pre- or post-processing logic. Furthermore, Im2Seq models have demonstrated to deliver state-of-the-art prediction accuracy [9]. This motivated the authors to investigate if the performance (both in accuracy and inference time) can be further improved by optimising the table structure representation language. We believe this is a necessary step before further improving neural network architectures for this task." }, { "label": "section_header", "id": 3, "page_no": 3, "cluster": { "id": 3, "label": "section_header", "bbox": { "l": 134.8, "t": 605.5, "r": 269.6, "b": 616.1, "coord_origin": "TOPLEFT" }, "confidence": 0.94, "cells": [ { "index": 51, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 134.8, "r_y0": 616.1, "r_x1": 141.5, "r_y1": 616.1, "r_x2": 141.5, "r_y2": 605.5, "r_x3": 134.8, "r_y3": 605.5, "coord_origin": "TOPLEFT" }, "text": "3", "orig": "3", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 52, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 154.9, "r_y0": 616.1, "r_x1": 269.6, "r_y1": 616.1, "r_x2": 269.6, "r_y2": 605.5, "r_x3": 154.9, "r_y3": 605.5, "coord_origin": "TOPLEFT" }, "text": "Problem Statement", "orig": "Problem Statement", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, "text": "3 Problem Statement" }, { "label": "text", "id": 1, "page_no": 3, "cluster": { "id": 1, "label": "text", "bbox": { "l": 134.8, "t": 632.1, "r": 480.6, "b": 664.9, "coord_origin": "TOPLEFT" }, "confidence": 0.97, "cells": [ { "index": 53, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 134.8, "r_y0": 640.9, "r_x1": 480.6, "r_y1": 640.9, "r_x2": 480.6, "r_y2": 632.1, "r_x3": 134.8, "r_y3": 632.1, "coord_origin": "TOPLEFT" }, "text": "All known Im2Seq based models for TSR fundamentally work in similar ways.", "orig": "All known Im2Seq based models for TSR fundamentally work in similar ways.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 54, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 134.8, "r_y0": 652.9, "r_x1": 480.6, "r_y1": 652.9, "r_x2": 480.6, "r_y2": 644.1, "r_x3": 134.8, "r_y3": 644.1, "coord_origin": "TOPLEFT" }, "text": "Given an image of a table, the Im2Seq model predicts the structure of the table", "orig": "Given an image of a table, the Im2Seq model predicts the structure of the table", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 55, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 134.8, "r_y0": 664.9, "r_x1": 480.6, "r_y1": 664.9, "r_x2": 480.6, "r_y2": 656.1, "r_x3": 134.8, "r_y3": 656.1, "coord_origin": "TOPLEFT" }, "text": "by generating a sequence of tokens. These tokens originate from a finite vocab-", "orig": "by generating a sequence of tokens. These tokens originate from a finite vocab-", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, "text": "All known Im2Seq based models for TSR fundamentally work in similar ways. Given an image of a table, the Im2Seq model predicts the structure of the table by generating a sequence of tokens. These tokens originate from a finite vocab-" } ], "headers": [ { "label": "page_header", "id": 6, "page_no": 3, "cluster": { "id": 6, "label": "page_header", "bbox": { "l": 134.8, "t": 93.8, "r": 139.4, "b": 101.8, "coord_origin": "TOPLEFT" }, "confidence": 0.79, "cells": [ { "index": 0, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 134.8, "r_y0": 101.8, "r_x1": 139.4, "r_y1": 101.8, "r_x2": 139.4, "r_y2": 93.8, "r_x3": 134.8, "r_y3": 93.8, "coord_origin": "TOPLEFT" }, "text": "4", "orig": "4", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, "text": "4" }, { "label": "page_header", "id": 5, "page_no": 3, "cluster": { "id": 5, "label": "page_header", "bbox": { "l": 167.8, "t": 93.8, "r": 231.7, "b": 101.8, "coord_origin": "TOPLEFT" }, "confidence": 0.9, "cells": [ { "index": 1, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 167.8, "r_y0": 101.8, "r_x1": 178.1, "r_y1": 101.8, "r_x2": 178.1, "r_y2": 93.8, "r_x3": 167.8, "r_y3": 93.8, "coord_origin": "TOPLEFT" }, "text": "M.", "orig": "M.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 2, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 182.4, "r_y0": 101.8, "r_x1": 231.7, "r_y1": 101.8, "r_x2": 231.7, "r_y2": 93.8, "r_x3": 182.4, "r_y3": 93.8, "coord_origin": "TOPLEFT" }, "text": "Lysak, et al.", "orig": "Lysak, et al.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, "text": "M. Lysak, et al." } ] } }, { "page_no": 4, "size": { "width": 612.0, "height": 792.0 }, "parsed_page": { "dimension": { "angle": 0.0, "rect": { "r_x0": 0.0, "r_y0": 0.0, "r_x1": 612.0, "r_y1": 0.0, "r_x2": 612.0, "r_y2": 792.0, "r_x3": 0.0, "r_y3": 792.0, "coord_origin": "BOTTOMLEFT" }, "boundary_type": "crop_box", "art_bbox": { "l": 0.0, "t": 792.0, "r": 612.0, "b": 0.0, "coord_origin": "BOTTOMLEFT" }, "bleed_bbox": { "l": 0.0, "t": 792.0, "r": 612.0, "b": 0.0, "coord_origin": "BOTTOMLEFT" }, "crop_bbox": { "l": 0.0, "t": 792.0, "r": 612.0, "b": 0.0, "coord_origin": "BOTTOMLEFT" }, "media_bbox": { "l": 0.0, "t": 792.0, "r": 612.0, "b": 0.0, "coord_origin": "BOTTOMLEFT" }, "trim_bbox": { "l": 0.0, "t": 792.0, "r": 612.0, "b": 0.0, "coord_origin": "BOTTOMLEFT" } }, "bitmap_resources": [], "char_cells": [], "word_cells": [], "textline_cells": [ { "index": 0, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 194.5, "r_y0": 101.8, "r_x1": 447.5, "r_y1": 101.8, "r_x2": 447.5, "r_y2": 93.8, "r_x3": 194.5, "r_y3": 93.8, "coord_origin": "TOPLEFT" }, "text": "Optimized Table Tokenization for Table Structure Recognition", "orig": "Optimized Table Tokenization for Table Structure Recognition", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 1, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 476.0, "r_y0": 101.8, "r_x1": 480.6, "r_y1": 101.8, "r_x2": 480.6, "r_y2": 93.8, "r_x3": 476.0, "r_y3": 93.8, "coord_origin": "TOPLEFT" }, "text": "5", "orig": "5", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 2, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 134.8, "r_y0": 127.7, "r_x1": 480.6, "r_y1": 127.7, "r_x2": 480.6, "r_y2": 118.9, "r_x3": 134.8, "r_y3": 118.9, "coord_origin": "TOPLEFT" }, "text": "ulary and can be interpreted as a table structure. For example, with the HTML", "orig": "ulary and can be interpreted as a table structure. For example, with the HTML", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 3, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 134.8, "r_y0": 139.7, "r_x1": 162.5, "r_y1": 139.7, "r_x2": 162.5, "r_y2": 130.9, "r_x3": 134.8, "r_y3": 130.9, "coord_origin": "TOPLEFT" }, "text": "tokens", "orig": "tokens", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 4, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 166.4, "r_y0": 139.7, "r_x1": 201.7, "r_y1": 139.7, "r_x2": 201.7, "r_y2": 130.9, "r_x3": 166.4, "r_y3": 130.9, "coord_origin": "TOPLEFT" }, "text": "", "orig": "
", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 5, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 201.7, "r_y0": 139.7, "r_x1": 204.5, "r_y1": 139.7, "r_x2": 204.5, "r_y2": 130.9, "r_x3": 201.7, "r_y3": 130.9, "coord_origin": "TOPLEFT" }, "text": ",", "orig": ",", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 6, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 208.4, "r_y0": 139.7, "r_x1": 248.9, "r_y1": 139.7, "r_x2": 248.9, "r_y2": 130.9, "r_x3": 208.4, "r_y3": 130.9, "coord_origin": "TOPLEFT" }, "text": "
", "orig": "", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 7, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 248.9, "r_y0": 139.7, "r_x1": 251.6, "r_y1": 139.7, "r_x2": 251.6, "r_y2": 130.9, "r_x3": 248.9, "r_y3": 130.9, "coord_origin": "TOPLEFT" }, "text": ",", "orig": ",", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 8, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 255.5, "r_y0": 139.7, "r_x1": 278.3, "r_y1": 139.7, "r_x2": 278.3, "r_y2": 130.9, "r_x3": 255.5, "r_y3": 130.9, "coord_origin": "TOPLEFT" }, "text": "", "orig": "", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 9, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 278.3, "r_y0": 139.7, "r_x1": 281.1, "r_y1": 139.7, "r_x2": 281.1, "r_y2": 130.9, "r_x3": 278.3, "r_y3": 130.9, "coord_origin": "TOPLEFT" }, "text": ",", "orig": ",", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 10, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 284.9, "r_y0": 139.7, "r_x1": 312.8, "r_y1": 139.7, "r_x2": 312.8, "r_y2": 130.9, "r_x3": 284.9, "r_y3": 130.9, "coord_origin": "TOPLEFT" }, "text": "", "orig": "", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 11, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 312.8, "r_y0": 139.7, "r_x1": 315.6, "r_y1": 139.7, "r_x2": 315.6, "r_y2": 130.9, "r_x3": 312.8, "r_y3": 130.9, "coord_origin": "TOPLEFT" }, "text": ",", "orig": ",", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 12, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 319.5, "r_y0": 139.7, "r_x1": 343.1, "r_y1": 139.7, "r_x2": 343.1, "r_y2": 130.9, "r_x3": 319.5, "r_y3": 130.9, "coord_origin": "TOPLEFT" }, "text": "", "orig": "", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 13, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 347.1, "r_y0": 139.7, "r_x1": 363.2, "r_y1": 139.7, "r_x2": 363.2, "r_y2": 130.9, "r_x3": 347.1, "r_y3": 130.9, "coord_origin": "TOPLEFT" }, "text": "and", "orig": "and", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 14, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 367.1, "r_y0": 139.7, "r_x1": 395.8, "r_y1": 139.7, "r_x2": 395.8, "r_y2": 130.9, "r_x3": 367.1, "r_y3": 130.9, "coord_origin": "TOPLEFT" }, "text": "", "orig": "", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 15, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 395.8, "r_y0": 139.7, "r_x1": 480.6, "r_y1": 139.7, "r_x2": 480.6, "r_y2": 130.9, "r_x3": 395.8, "r_y3": 130.9, "coord_origin": "TOPLEFT" }, "text": ", one can construct", "orig": ", one can construct", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 16, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 134.8, "r_y0": 151.6, "r_x1": 480.6, "r_y1": 151.6, "r_x2": 480.6, "r_y2": 142.8, "r_x3": 134.8, "r_y3": 142.8, "coord_origin": "TOPLEFT" }, "text": "simple table structures without any spanning cells. In reality though, one needs", "orig": "simple table structures without any spanning cells. In reality though, one needs", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 17, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 134.8, "r_y0": 163.6, "r_x1": 480.6, "r_y1": 163.6, "r_x2": 480.6, "r_y2": 154.8, "r_x3": 134.8, "r_y3": 154.8, "coord_origin": "TOPLEFT" }, "text": "at least 28 HTML tokens to describe the most common complex tables observed", "orig": "at least 28 HTML tokens to describe the most common complex tables observed", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 18, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 134.8, "r_y0": 175.6, "r_x1": 480.6, "r_y1": 175.6, "r_x2": 480.6, "r_y2": 166.8, "r_x3": 134.8, "r_y3": 166.8, "coord_origin": "TOPLEFT" }, "text": "in real-world documents [21,22], due to a variety of spanning cells definitions in", "orig": "in real-world documents [21,22], due to a variety of spanning cells definitions in", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 19, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 134.8, "r_y0": 187.5, "r_x1": 261.9, "r_y1": 187.5, "r_x2": 261.9, "r_y2": 178.7, "r_x3": 134.8, "r_y3": 178.7, "coord_origin": "TOPLEFT" }, "text": "the HTML token vocabulary.", "orig": "the HTML token vocabulary.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 20, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 145.6, "r_y0": 229.0, "r_x1": 173.5, "r_y1": 229.0, "r_x2": 173.5, "r_y2": 221.1, "r_x3": 145.6, "r_y3": 221.1, "coord_origin": "TOPLEFT" }, "text": "Fig. 2.", "orig": "Fig. 2.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 21, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 176.6, "r_y0": 229.2, "r_x1": 469.8, "r_y1": 229.2, "r_x2": 469.8, "r_y2": 221.1, "r_x3": 176.6, "r_y3": 221.1, "coord_origin": "TOPLEFT" }, "text": "Frequency of tokens in HTML and OTSL as they appear in PubTabNet.", "orig": "Frequency of tokens in HTML and OTSL as they appear in PubTabNet.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 22, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 149.7, "r_y0": 377.0, "r_x1": 480.6, "r_y1": 377.0, "r_x2": 480.6, "r_y2": 368.2, "r_x3": 149.7, "r_y3": 368.2, "coord_origin": "TOPLEFT" }, "text": "Obviously, HTML and other general-purpose markup languages were not de-", "orig": "Obviously, HTML and other general-purpose markup languages were not de-", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 23, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 134.8, "r_y0": 389.0, "r_x1": 480.6, "r_y1": 389.0, "r_x2": 480.6, "r_y2": 380.2, "r_x3": 134.8, "r_y3": 380.2, "coord_origin": "TOPLEFT" }, "text": "signed for Im2Seq models. As such, they have some serious drawbacks. First, the", "orig": "signed for Im2Seq models. As such, they have some serious drawbacks. First, the", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 24, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 134.8, "r_y0": 400.9, "r_x1": 480.6, "r_y1": 400.9, "r_x2": 480.6, "r_y2": 392.1, "r_x3": 134.8, "r_y3": 392.1, "coord_origin": "TOPLEFT" }, "text": "token vocabulary needs to be artificially large in order to describe all plausible", "orig": "token vocabulary needs to be artificially large in order to describe all plausible", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 25, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 134.8, "r_y0": 412.9, "r_x1": 480.6, "r_y1": 412.9, "r_x2": 480.6, "r_y2": 404.1, "r_x3": 134.8, "r_y3": 404.1, "coord_origin": "TOPLEFT" }, "text": "tabular structures. Since most Im2Seq models use an autoregressive approach,", "orig": "tabular structures. Since most Im2Seq models use an autoregressive approach,", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 26, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 134.8, "r_y0": 424.8, "r_x1": 480.6, "r_y1": 424.8, "r_x2": 480.6, "r_y2": 416.0, "r_x3": 134.8, "r_y3": 416.0, "coord_origin": "TOPLEFT" }, "text": "they generate the sequence token by token. Therefore, to reduce inference time,", "orig": "they generate the sequence token by token. Therefore, to reduce inference time,", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 27, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 134.8, "r_y0": 436.8, "r_x1": 480.6, "r_y1": 436.8, "r_x2": 480.6, "r_y2": 428.0, "r_x3": 134.8, "r_y3": 428.0, "coord_origin": "TOPLEFT" }, "text": "a shorter sequence length is critical. Every table-cell is represented by at least", "orig": "a shorter sequence length is critical. Every table-cell is represented by at least", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 28, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 134.8, "r_y0": 448.7, "r_x1": 187.9, "r_y1": 448.7, "r_x2": 187.9, "r_y2": 439.9, "r_x3": 134.8, "r_y3": 439.9, "coord_origin": "TOPLEFT" }, "text": "two tokens (", "orig": "two tokens (", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 29, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 187.9, "r_y0": 448.7, "r_x1": 211.6, "r_y1": 448.7, "r_x2": 211.6, "r_y2": 439.9, "r_x3": 187.9, "r_y3": 439.9, "coord_origin": "TOPLEFT" }, "text": "", "orig": "", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 30, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 214.8, "r_y0": 448.7, "r_x1": 230.8, "r_y1": 448.7, "r_x2": 230.8, "r_y2": 439.9, "r_x3": 214.8, "r_y3": 439.9, "coord_origin": "TOPLEFT" }, "text": "and", "orig": "and", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 31, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 233.8, "r_y0": 448.7, "r_x1": 262.6, "r_y1": 448.7, "r_x2": 262.6, "r_y2": 439.9, "r_x3": 233.8, "r_y3": 439.9, "coord_origin": "TOPLEFT" }, "text": "", "orig": "", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 32, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 262.7, "r_y0": 448.7, "r_x1": 480.6, "r_y1": 448.7, "r_x2": 480.6, "r_y2": 439.9, "r_x3": 262.7, "r_y3": 439.9, "coord_origin": "TOPLEFT" }, "text": "). Furthermore, when tokenizing the HTML struc-", "orig": "). Furthermore, when tokenizing the HTML struc-", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 33, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 134.8, "r_y0": 460.7, "r_x1": 480.6, "r_y1": 460.7, "r_x2": 480.6, "r_y2": 451.9, "r_x3": 134.8, "r_y3": 451.9, "coord_origin": "TOPLEFT" }, "text": "ture, one needs to explicitly enumerate possible column-spans and row-spans", "orig": "ture, one needs to explicitly enumerate possible column-spans and row-spans", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 34, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 134.8, "r_y0": 472.6, "r_x1": 480.6, "r_y1": 472.6, "r_x2": 480.6, "r_y2": 463.8, "r_x3": 134.8, "r_y3": 463.8, "coord_origin": "TOPLEFT" }, "text": "as words. In practice, this ends up requiring 28 different HTML tokens (when", "orig": "as words. In practice, this ends up requiring 28 different HTML tokens (when", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 35, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 134.8, "r_y0": 484.6, "r_x1": 480.6, "r_y1": 484.6, "r_x2": 480.6, "r_y2": 475.8, "r_x3": 134.8, "r_y3": 475.8, "coord_origin": "TOPLEFT" }, "text": "including column- and row-spans up to 10 cells) just to describe every table in", "orig": "including column- and row-spans up to 10 cells) just to describe every table in", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 36, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 134.8, "r_y0": 496.6, "r_x1": 480.6, "r_y1": 496.6, "r_x2": 480.6, "r_y2": 487.8, "r_x3": 134.8, "r_y3": 487.8, "coord_origin": "TOPLEFT" }, "text": "the PubTabNet dataset. Clearly, not every token is equally represented, as is", "orig": "the PubTabNet dataset. Clearly, not every token is equally represented, as is", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 37, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 134.8, "r_y0": 508.5, "r_x1": 480.6, "r_y1": 508.5, "r_x2": 480.6, "r_y2": 499.7, "r_x3": 134.8, "r_y3": 499.7, "coord_origin": "TOPLEFT" }, "text": "depicted in Figure 2. This skewed distribution of tokens in combination with", "orig": "depicted in Figure 2. This skewed distribution of tokens in combination with", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 38, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 134.8, "r_y0": 520.5, "r_x1": 480.6, "r_y1": 520.5, "r_x2": 480.6, "r_y2": 511.7, "r_x3": 134.8, "r_y3": 511.7, "coord_origin": "TOPLEFT" }, "text": "variable token row-length makes it challenging for models to learn the HTML", "orig": "variable token row-length makes it challenging for models to learn the HTML", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 39, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 134.8, "r_y0": 532.4, "r_x1": 176.9, "r_y1": 532.4, "r_x2": 176.9, "r_y2": 523.6, "r_x3": 134.8, "r_y3": 523.6, "coord_origin": "TOPLEFT" }, "text": "structure.", "orig": "structure.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 40, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 149.7, "r_y0": 544.8, "r_x1": 480.6, "r_y1": 544.8, "r_x2": 480.6, "r_y2": 536.0, "r_x3": 149.7, "r_y3": 536.0, "coord_origin": "TOPLEFT" }, "text": "Additionally, it would be desirable if the representation would easily allow", "orig": "Additionally, it would be desirable if the representation would easily allow", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 41, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 134.8, "r_y0": 556.8, "r_x1": 480.6, "r_y1": 556.8, "r_x2": 480.6, "r_y2": 548.0, "r_x3": 134.8, "r_y3": 548.0, "coord_origin": "TOPLEFT" }, "text": "an early detection of invalid sequences on-the-go, before the prediction of the", "orig": "an early detection of invalid sequences on-the-go, before the prediction of the", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 42, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 134.8, "r_y0": 568.7, "r_x1": 480.6, "r_y1": 568.7, "r_x2": 480.6, "r_y2": 560.0, "r_x3": 134.8, "r_y3": 560.0, "coord_origin": "TOPLEFT" }, "text": "entire table structure is completed. HTML is not well-suited for this purpose as", "orig": "entire table structure is completed. HTML is not well-suited for this purpose as", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 43, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 134.8, "r_y0": 580.7, "r_x1": 452.2, "r_y1": 580.7, "r_x2": 452.2, "r_y2": 571.9, "r_x3": 134.8, "r_y3": 571.9, "coord_origin": "TOPLEFT" }, "text": "the verification of incomplete sequences is non-trivial or even impossible.", "orig": "the verification of incomplete sequences is non-trivial or even impossible.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 44, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 149.7, "r_y0": 593.1, "r_x1": 480.6, "r_y1": 593.1, "r_x2": 480.6, "r_y2": 584.3, "r_x3": 149.7, "r_y3": 584.3, "coord_origin": "TOPLEFT" }, "text": "In a valid HTML table, the token sequence must describe a 2D grid of table", "orig": "In a valid HTML table, the token sequence must describe a 2D grid of table", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 45, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 134.8, "r_y0": 605.1, "r_x1": 480.6, "r_y1": 605.1, "r_x2": 480.6, "r_y2": 596.3, "r_x3": 134.8, "r_y3": 596.3, "coord_origin": "TOPLEFT" }, "text": "cells, serialised in row-major ordering, where each row and each column have", "orig": "cells, serialised in row-major ordering, where each row and each column have", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 46, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 134.8, "r_y0": 617.0, "r_x1": 480.6, "r_y1": 617.0, "r_x2": 480.6, "r_y2": 608.2, "r_x3": 134.8, "r_y3": 608.2, "coord_origin": "TOPLEFT" }, "text": "the same length (while considering row- and column-spans). Furthermore, every", "orig": "the same length (while considering row- and column-spans). Furthermore, every", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 47, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 134.8, "r_y0": 629.0, "r_x1": 480.6, "r_y1": 629.0, "r_x2": 480.6, "r_y2": 620.2, "r_x3": 134.8, "r_y3": 620.2, "coord_origin": "TOPLEFT" }, "text": "opening tag in HTML needs to be matched by a closing tag in a correct hierar-", "orig": "opening tag in HTML needs to be matched by a closing tag in a correct hierar-", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 48, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 134.8, "r_y0": 640.9, "r_x1": 480.6, "r_y1": 640.9, "r_x2": 480.6, "r_y2": 632.1, "r_x3": 134.8, "r_y3": 632.1, "coord_origin": "TOPLEFT" }, "text": "chical manner. Since the number of tokens for each table row and column can", "orig": "chical manner. Since the number of tokens for each table row and column can", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 49, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 134.8, "r_y0": 652.9, "r_x1": 480.6, "r_y1": 652.9, "r_x2": 480.6, "r_y2": 644.1, "r_x3": 134.8, "r_y3": 644.1, "coord_origin": "TOPLEFT" }, "text": "vary significantly, especially for large tables with many row- and column-spans,", "orig": "vary significantly, especially for large tables with many row- and column-spans,", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 50, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 134.8, "r_y0": 664.9, "r_x1": 480.6, "r_y1": 664.9, "r_x2": 480.6, "r_y2": 656.1, "r_x3": 134.8, "r_y3": 656.1, "coord_origin": "TOPLEFT" }, "text": "it is complex to verify the consistency of predicted structures during sequence", "orig": "it is complex to verify the consistency of predicted structures during sequence", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "has_chars": false, "has_words": false, "has_lines": true, "image": null, "lines": [] }, "predictions": { "layout": { "clusters": [ { "id": 5, "label": "page_header", "bbox": { "l": 194.5, "t": 93.8, "r": 447.5, "b": 101.8, "coord_origin": "TOPLEFT" }, "confidence": 0.93, "cells": [ { "index": 0, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 194.5, "r_y0": 101.8, "r_x1": 447.5, "r_y1": 101.8, "r_x2": 447.5, "r_y2": 93.8, "r_x3": 194.5, "r_y3": 93.8, "coord_origin": "TOPLEFT" }, "text": "Optimized Table Tokenization for Table Structure Recognition", "orig": "Optimized Table Tokenization for Table Structure Recognition", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 6, "label": "page_header", "bbox": { "l": 476.0, "t": 93.8, "r": 480.6, "b": 101.8, "coord_origin": "TOPLEFT" }, "confidence": 0.87, "cells": [ { "index": 1, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 476.0, "r_y0": 101.8, "r_x1": 480.6, "r_y1": 101.8, "r_x2": 480.6, "r_y2": 93.8, "r_x3": 476.0, "r_y3": 93.8, "coord_origin": "TOPLEFT" }, "text": "5", "orig": "5", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 0, "label": "text", "bbox": { "l": 134.8, "t": 118.9, "r": 480.6, "b": 187.5, "coord_origin": "TOPLEFT" }, "confidence": 0.99, "cells": [ { "index": 2, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 134.8, "r_y0": 127.7, "r_x1": 480.6, "r_y1": 127.7, "r_x2": 480.6, "r_y2": 118.9, "r_x3": 134.8, "r_y3": 118.9, "coord_origin": "TOPLEFT" }, "text": "ulary and can be interpreted as a table structure. For example, with the HTML", "orig": "ulary and can be interpreted as a table structure. For example, with the HTML", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 3, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 134.8, "r_y0": 139.7, "r_x1": 162.5, "r_y1": 139.7, "r_x2": 162.5, "r_y2": 130.9, "r_x3": 134.8, "r_y3": 130.9, "coord_origin": "TOPLEFT" }, "text": "tokens", "orig": "tokens", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 4, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 166.4, "r_y0": 139.7, "r_x1": 201.7, "r_y1": 139.7, "r_x2": 201.7, "r_y2": 130.9, "r_x3": 166.4, "r_y3": 130.9, "coord_origin": "TOPLEFT" }, "text": "", "orig": "
", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 5, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 201.7, "r_y0": 139.7, "r_x1": 204.5, "r_y1": 139.7, "r_x2": 204.5, "r_y2": 130.9, "r_x3": 201.7, "r_y3": 130.9, "coord_origin": "TOPLEFT" }, "text": ",", "orig": ",", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 6, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 208.4, "r_y0": 139.7, "r_x1": 248.9, "r_y1": 139.7, "r_x2": 248.9, "r_y2": 130.9, "r_x3": 208.4, "r_y3": 130.9, "coord_origin": "TOPLEFT" }, "text": "
", "orig": "", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 7, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 248.9, "r_y0": 139.7, "r_x1": 251.6, "r_y1": 139.7, "r_x2": 251.6, "r_y2": 130.9, "r_x3": 248.9, "r_y3": 130.9, "coord_origin": "TOPLEFT" }, "text": ",", "orig": ",", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 8, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 255.5, "r_y0": 139.7, "r_x1": 278.3, "r_y1": 139.7, "r_x2": 278.3, "r_y2": 130.9, "r_x3": 255.5, "r_y3": 130.9, "coord_origin": "TOPLEFT" }, "text": "", "orig": "", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 9, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 278.3, "r_y0": 139.7, "r_x1": 281.1, "r_y1": 139.7, "r_x2": 281.1, "r_y2": 130.9, "r_x3": 278.3, "r_y3": 130.9, "coord_origin": "TOPLEFT" }, "text": ",", "orig": ",", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 10, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 284.9, "r_y0": 139.7, "r_x1": 312.8, "r_y1": 139.7, "r_x2": 312.8, "r_y2": 130.9, "r_x3": 284.9, "r_y3": 130.9, "coord_origin": "TOPLEFT" }, "text": "", "orig": "", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 11, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 312.8, "r_y0": 139.7, "r_x1": 315.6, "r_y1": 139.7, "r_x2": 315.6, "r_y2": 130.9, "r_x3": 312.8, "r_y3": 130.9, "coord_origin": "TOPLEFT" }, "text": ",", "orig": ",", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 12, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 319.5, "r_y0": 139.7, "r_x1": 343.1, "r_y1": 139.7, "r_x2": 343.1, "r_y2": 130.9, "r_x3": 319.5, "r_y3": 130.9, "coord_origin": "TOPLEFT" }, "text": "", "orig": "", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 13, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 347.1, "r_y0": 139.7, "r_x1": 363.2, "r_y1": 139.7, "r_x2": 363.2, "r_y2": 130.9, "r_x3": 347.1, "r_y3": 130.9, "coord_origin": "TOPLEFT" }, "text": "and", "orig": "and", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 14, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 367.1, "r_y0": 139.7, "r_x1": 395.8, "r_y1": 139.7, "r_x2": 395.8, "r_y2": 130.9, "r_x3": 367.1, "r_y3": 130.9, "coord_origin": "TOPLEFT" }, "text": "", "orig": "", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 15, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 395.8, "r_y0": 139.7, "r_x1": 480.6, "r_y1": 139.7, "r_x2": 480.6, "r_y2": 130.9, "r_x3": 395.8, "r_y3": 130.9, "coord_origin": "TOPLEFT" }, "text": ", one can construct", "orig": ", one can construct", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 16, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 134.8, "r_y0": 151.6, "r_x1": 480.6, "r_y1": 151.6, "r_x2": 480.6, "r_y2": 142.8, "r_x3": 134.8, "r_y3": 142.8, "coord_origin": "TOPLEFT" }, "text": "simple table structures without any spanning cells. In reality though, one needs", "orig": "simple table structures without any spanning cells. In reality though, one needs", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 17, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 134.8, "r_y0": 163.6, "r_x1": 480.6, "r_y1": 163.6, "r_x2": 480.6, "r_y2": 154.8, "r_x3": 134.8, "r_y3": 154.8, "coord_origin": "TOPLEFT" }, "text": "at least 28 HTML tokens to describe the most common complex tables observed", "orig": "at least 28 HTML tokens to describe the most common complex tables observed", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 18, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 134.8, "r_y0": 175.6, "r_x1": 480.6, "r_y1": 175.6, "r_x2": 480.6, "r_y2": 166.8, "r_x3": 134.8, "r_y3": 166.8, "coord_origin": "TOPLEFT" }, "text": "in real-world documents [21,22], due to a variety of spanning cells definitions in", "orig": "in real-world documents [21,22], due to a variety of spanning cells definitions in", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 19, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 134.8, "r_y0": 187.5, "r_x1": 261.9, "r_y1": 187.5, "r_x2": 261.9, "r_y2": 178.7, "r_x3": 134.8, "r_y3": 178.7, "coord_origin": "TOPLEFT" }, "text": "the HTML token vocabulary.", "orig": "the HTML token vocabulary.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 7, "label": "caption", "bbox": { "l": 145.6, "t": 221.1, "r": 469.8, "b": 229.2, "coord_origin": "TOPLEFT" }, "confidence": 0.85, "cells": [ { "index": 20, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 145.6, "r_y0": 229.0, "r_x1": 173.5, "r_y1": 229.0, "r_x2": 173.5, "r_y2": 221.1, "r_x3": 145.6, "r_y3": 221.1, "coord_origin": "TOPLEFT" }, "text": "Fig. 2.", "orig": "Fig. 2.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 21, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 176.6, "r_y0": 229.2, "r_x1": 469.8, "r_y1": 229.2, "r_x2": 469.8, "r_y2": 221.1, "r_x3": 176.6, "r_y3": 221.1, "coord_origin": "TOPLEFT" }, "text": "Frequency of tokens in HTML and OTSL as they appear in PubTabNet.", "orig": "Frequency of tokens in HTML and OTSL as they appear in PubTabNet.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 1, "label": "text", "bbox": { "l": 134.8, "t": 368.2, "r": 480.6, "b": 532.4, "coord_origin": "TOPLEFT" }, "confidence": 0.98, "cells": [ { "index": 22, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 149.7, "r_y0": 377.0, "r_x1": 480.6, "r_y1": 377.0, "r_x2": 480.6, "r_y2": 368.2, "r_x3": 149.7, "r_y3": 368.2, "coord_origin": "TOPLEFT" }, "text": "Obviously, HTML and other general-purpose markup languages were not de-", "orig": "Obviously, HTML and other general-purpose markup languages were not de-", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 23, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 134.8, "r_y0": 389.0, "r_x1": 480.6, "r_y1": 389.0, "r_x2": 480.6, "r_y2": 380.2, "r_x3": 134.8, "r_y3": 380.2, "coord_origin": "TOPLEFT" }, "text": "signed for Im2Seq models. As such, they have some serious drawbacks. First, the", "orig": "signed for Im2Seq models. As such, they have some serious drawbacks. First, the", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 24, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 134.8, "r_y0": 400.9, "r_x1": 480.6, "r_y1": 400.9, "r_x2": 480.6, "r_y2": 392.1, "r_x3": 134.8, "r_y3": 392.1, "coord_origin": "TOPLEFT" }, "text": "token vocabulary needs to be artificially large in order to describe all plausible", "orig": "token vocabulary needs to be artificially large in order to describe all plausible", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 25, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 134.8, "r_y0": 412.9, "r_x1": 480.6, "r_y1": 412.9, "r_x2": 480.6, "r_y2": 404.1, "r_x3": 134.8, "r_y3": 404.1, "coord_origin": "TOPLEFT" }, "text": "tabular structures. Since most Im2Seq models use an autoregressive approach,", "orig": "tabular structures. Since most Im2Seq models use an autoregressive approach,", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 26, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 134.8, "r_y0": 424.8, "r_x1": 480.6, "r_y1": 424.8, "r_x2": 480.6, "r_y2": 416.0, "r_x3": 134.8, "r_y3": 416.0, "coord_origin": "TOPLEFT" }, "text": "they generate the sequence token by token. Therefore, to reduce inference time,", "orig": "they generate the sequence token by token. Therefore, to reduce inference time,", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 27, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 134.8, "r_y0": 436.8, "r_x1": 480.6, "r_y1": 436.8, "r_x2": 480.6, "r_y2": 428.0, "r_x3": 134.8, "r_y3": 428.0, "coord_origin": "TOPLEFT" }, "text": "a shorter sequence length is critical. Every table-cell is represented by at least", "orig": "a shorter sequence length is critical. Every table-cell is represented by at least", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 28, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 134.8, "r_y0": 448.7, "r_x1": 187.9, "r_y1": 448.7, "r_x2": 187.9, "r_y2": 439.9, "r_x3": 134.8, "r_y3": 439.9, "coord_origin": "TOPLEFT" }, "text": "two tokens (", "orig": "two tokens (", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 29, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 187.9, "r_y0": 448.7, "r_x1": 211.6, "r_y1": 448.7, "r_x2": 211.6, "r_y2": 439.9, "r_x3": 187.9, "r_y3": 439.9, "coord_origin": "TOPLEFT" }, "text": "", "orig": "", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 30, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 214.8, "r_y0": 448.7, "r_x1": 230.8, "r_y1": 448.7, "r_x2": 230.8, "r_y2": 439.9, "r_x3": 214.8, "r_y3": 439.9, "coord_origin": "TOPLEFT" }, "text": "and", "orig": "and", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 31, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 233.8, "r_y0": 448.7, "r_x1": 262.6, "r_y1": 448.7, "r_x2": 262.6, "r_y2": 439.9, "r_x3": 233.8, "r_y3": 439.9, "coord_origin": "TOPLEFT" }, "text": "", "orig": "", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 32, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 262.7, "r_y0": 448.7, "r_x1": 480.6, "r_y1": 448.7, "r_x2": 480.6, "r_y2": 439.9, "r_x3": 262.7, "r_y3": 439.9, "coord_origin": "TOPLEFT" }, "text": "). Furthermore, when tokenizing the HTML struc-", "orig": "). Furthermore, when tokenizing the HTML struc-", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 33, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 134.8, "r_y0": 460.7, "r_x1": 480.6, "r_y1": 460.7, "r_x2": 480.6, "r_y2": 451.9, "r_x3": 134.8, "r_y3": 451.9, "coord_origin": "TOPLEFT" }, "text": "ture, one needs to explicitly enumerate possible column-spans and row-spans", "orig": "ture, one needs to explicitly enumerate possible column-spans and row-spans", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 34, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 134.8, "r_y0": 472.6, "r_x1": 480.6, "r_y1": 472.6, "r_x2": 480.6, "r_y2": 463.8, "r_x3": 134.8, "r_y3": 463.8, "coord_origin": "TOPLEFT" }, "text": "as words. In practice, this ends up requiring 28 different HTML tokens (when", "orig": "as words. In practice, this ends up requiring 28 different HTML tokens (when", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 35, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 134.8, "r_y0": 484.6, "r_x1": 480.6, "r_y1": 484.6, "r_x2": 480.6, "r_y2": 475.8, "r_x3": 134.8, "r_y3": 475.8, "coord_origin": "TOPLEFT" }, "text": "including column- and row-spans up to 10 cells) just to describe every table in", "orig": "including column- and row-spans up to 10 cells) just to describe every table in", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 36, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 134.8, "r_y0": 496.6, "r_x1": 480.6, "r_y1": 496.6, "r_x2": 480.6, "r_y2": 487.8, "r_x3": 134.8, "r_y3": 487.8, "coord_origin": "TOPLEFT" }, "text": "the PubTabNet dataset. Clearly, not every token is equally represented, as is", "orig": "the PubTabNet dataset. Clearly, not every token is equally represented, as is", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 37, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 134.8, "r_y0": 508.5, "r_x1": 480.6, "r_y1": 508.5, "r_x2": 480.6, "r_y2": 499.7, "r_x3": 134.8, "r_y3": 499.7, "coord_origin": "TOPLEFT" }, "text": "depicted in Figure 2. This skewed distribution of tokens in combination with", "orig": "depicted in Figure 2. This skewed distribution of tokens in combination with", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 38, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 134.8, "r_y0": 520.5, "r_x1": 480.6, "r_y1": 520.5, "r_x2": 480.6, "r_y2": 511.7, "r_x3": 134.8, "r_y3": 511.7, "coord_origin": "TOPLEFT" }, "text": "variable token row-length makes it challenging for models to learn the HTML", "orig": "variable token row-length makes it challenging for models to learn the HTML", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 39, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 134.8, "r_y0": 532.4, "r_x1": 176.9, "r_y1": 532.4, "r_x2": 176.9, "r_y2": 523.6, "r_x3": 134.8, "r_y3": 523.6, "coord_origin": "TOPLEFT" }, "text": "structure.", "orig": "structure.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 3, "label": "text", "bbox": { "l": 134.8, "t": 536.0, "r": 480.6, "b": 580.7, "coord_origin": "TOPLEFT" }, "confidence": 0.98, "cells": [ { "index": 40, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 149.7, "r_y0": 544.8, "r_x1": 480.6, "r_y1": 544.8, "r_x2": 480.6, "r_y2": 536.0, "r_x3": 149.7, "r_y3": 536.0, "coord_origin": "TOPLEFT" }, "text": "Additionally, it would be desirable if the representation would easily allow", "orig": "Additionally, it would be desirable if the representation would easily allow", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 41, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 134.8, "r_y0": 556.8, "r_x1": 480.6, "r_y1": 556.8, "r_x2": 480.6, "r_y2": 548.0, "r_x3": 134.8, "r_y3": 548.0, "coord_origin": "TOPLEFT" }, "text": "an early detection of invalid sequences on-the-go, before the prediction of the", "orig": "an early detection of invalid sequences on-the-go, before the prediction of the", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 42, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 134.8, "r_y0": 568.7, "r_x1": 480.6, "r_y1": 568.7, "r_x2": 480.6, "r_y2": 560.0, "r_x3": 134.8, "r_y3": 560.0, "coord_origin": "TOPLEFT" }, "text": "entire table structure is completed. HTML is not well-suited for this purpose as", "orig": "entire table structure is completed. HTML is not well-suited for this purpose as", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 43, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 134.8, "r_y0": 580.7, "r_x1": 452.2, "r_y1": 580.7, "r_x2": 452.2, "r_y2": 571.9, "r_x3": 134.8, "r_y3": 571.9, "coord_origin": "TOPLEFT" }, "text": "the verification of incomplete sequences is non-trivial or even impossible.", "orig": "the verification of incomplete sequences is non-trivial or even impossible.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 2, "label": "text", "bbox": { "l": 134.8, "t": 584.3, "r": 480.6, "b": 664.9, "coord_origin": "TOPLEFT" }, "confidence": 0.98, "cells": [ { "index": 44, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 149.7, "r_y0": 593.1, "r_x1": 480.6, "r_y1": 593.1, "r_x2": 480.6, "r_y2": 584.3, "r_x3": 149.7, "r_y3": 584.3, "coord_origin": "TOPLEFT" }, "text": "In a valid HTML table, the token sequence must describe a 2D grid of table", "orig": "In a valid HTML table, the token sequence must describe a 2D grid of table", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 45, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 134.8, "r_y0": 605.1, "r_x1": 480.6, "r_y1": 605.1, "r_x2": 480.6, "r_y2": 596.3, "r_x3": 134.8, "r_y3": 596.3, "coord_origin": "TOPLEFT" }, "text": "cells, serialised in row-major ordering, where each row and each column have", "orig": "cells, serialised in row-major ordering, where each row and each column have", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 46, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 134.8, "r_y0": 617.0, "r_x1": 480.6, "r_y1": 617.0, "r_x2": 480.6, "r_y2": 608.2, "r_x3": 134.8, "r_y3": 608.2, "coord_origin": "TOPLEFT" }, "text": "the same length (while considering row- and column-spans). Furthermore, every", "orig": "the same length (while considering row- and column-spans). Furthermore, every", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 47, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 134.8, "r_y0": 629.0, "r_x1": 480.6, "r_y1": 629.0, "r_x2": 480.6, "r_y2": 620.2, "r_x3": 134.8, "r_y3": 620.2, "coord_origin": "TOPLEFT" }, "text": "opening tag in HTML needs to be matched by a closing tag in a correct hierar-", "orig": "opening tag in HTML needs to be matched by a closing tag in a correct hierar-", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 48, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 134.8, "r_y0": 640.9, "r_x1": 480.6, "r_y1": 640.9, "r_x2": 480.6, "r_y2": 632.1, "r_x3": 134.8, "r_y3": 632.1, "coord_origin": "TOPLEFT" }, "text": "chical manner. Since the number of tokens for each table row and column can", "orig": "chical manner. Since the number of tokens for each table row and column can", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 49, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 134.8, "r_y0": 652.9, "r_x1": 480.6, "r_y1": 652.9, "r_x2": 480.6, "r_y2": 644.1, "r_x3": 134.8, "r_y3": 644.1, "coord_origin": "TOPLEFT" }, "text": "vary significantly, especially for large tables with many row- and column-spans,", "orig": "vary significantly, especially for large tables with many row- and column-spans,", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 50, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 134.8, "r_y0": 664.9, "r_x1": 480.6, "r_y1": 664.9, "r_x2": 480.6, "r_y2": 656.1, "r_x3": 134.8, "r_y3": 656.1, "coord_origin": "TOPLEFT" }, "text": "it is complex to verify the consistency of predicted structures during sequence", "orig": "it is complex to verify the consistency of predicted structures during sequence", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 4, "label": "picture", "bbox": { "l": 137.4, "t": 233.5, "r": 476.6, "b": 340.2, "coord_origin": "TOPLEFT" }, "confidence": 0.94, "cells": [], "children": [] } ] }, "tablestructure": { "table_map": {} }, "figures_classification": null, "equations_prediction": null, "vlm_response": null }, "assembled": { "elements": [ { "label": "page_header", "id": 5, "page_no": 4, "cluster": { "id": 5, "label": "page_header", "bbox": { "l": 194.5, "t": 93.8, "r": 447.5, "b": 101.8, "coord_origin": "TOPLEFT" }, "confidence": 0.93, "cells": [ { "index": 0, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 194.5, "r_y0": 101.8, "r_x1": 447.5, "r_y1": 101.8, "r_x2": 447.5, "r_y2": 93.8, "r_x3": 194.5, "r_y3": 93.8, "coord_origin": "TOPLEFT" }, "text": "Optimized Table Tokenization for Table Structure Recognition", "orig": "Optimized Table Tokenization for Table Structure Recognition", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, "text": "Optimized Table Tokenization for Table Structure Recognition" }, { "label": "page_header", "id": 6, "page_no": 4, "cluster": { "id": 6, "label": "page_header", "bbox": { "l": 476.0, "t": 93.8, "r": 480.6, "b": 101.8, "coord_origin": "TOPLEFT" }, "confidence": 0.87, "cells": [ { "index": 1, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 476.0, "r_y0": 101.8, "r_x1": 480.6, "r_y1": 101.8, "r_x2": 480.6, "r_y2": 93.8, "r_x3": 476.0, "r_y3": 93.8, "coord_origin": "TOPLEFT" }, "text": "5", "orig": "5", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, "text": "5" }, { "label": "text", "id": 0, "page_no": 4, "cluster": { "id": 0, "label": "text", "bbox": { "l": 134.8, "t": 118.9, "r": 480.6, "b": 187.5, "coord_origin": "TOPLEFT" }, "confidence": 0.99, "cells": [ { "index": 2, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 134.8, "r_y0": 127.7, "r_x1": 480.6, "r_y1": 127.7, "r_x2": 480.6, "r_y2": 118.9, "r_x3": 134.8, "r_y3": 118.9, "coord_origin": "TOPLEFT" }, "text": "ulary and can be interpreted as a table structure. For example, with the HTML", "orig": "ulary and can be interpreted as a table structure. For example, with the HTML", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 3, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 134.8, "r_y0": 139.7, "r_x1": 162.5, "r_y1": 139.7, "r_x2": 162.5, "r_y2": 130.9, "r_x3": 134.8, "r_y3": 130.9, "coord_origin": "TOPLEFT" }, "text": "tokens", "orig": "tokens", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 4, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 166.4, "r_y0": 139.7, "r_x1": 201.7, "r_y1": 139.7, "r_x2": 201.7, "r_y2": 130.9, "r_x3": 166.4, "r_y3": 130.9, "coord_origin": "TOPLEFT" }, "text": "", "orig": "
", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 5, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 201.7, "r_y0": 139.7, "r_x1": 204.5, "r_y1": 139.7, "r_x2": 204.5, "r_y2": 130.9, "r_x3": 201.7, "r_y3": 130.9, "coord_origin": "TOPLEFT" }, "text": ",", "orig": ",", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 6, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 208.4, "r_y0": 139.7, "r_x1": 248.9, "r_y1": 139.7, "r_x2": 248.9, "r_y2": 130.9, "r_x3": 208.4, "r_y3": 130.9, "coord_origin": "TOPLEFT" }, "text": "
", "orig": "", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 7, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 248.9, "r_y0": 139.7, "r_x1": 251.6, "r_y1": 139.7, "r_x2": 251.6, "r_y2": 130.9, "r_x3": 248.9, "r_y3": 130.9, "coord_origin": "TOPLEFT" }, "text": ",", "orig": ",", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 8, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 255.5, "r_y0": 139.7, "r_x1": 278.3, "r_y1": 139.7, "r_x2": 278.3, "r_y2": 130.9, "r_x3": 255.5, "r_y3": 130.9, "coord_origin": "TOPLEFT" }, "text": "", "orig": "", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 9, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 278.3, "r_y0": 139.7, "r_x1": 281.1, "r_y1": 139.7, "r_x2": 281.1, "r_y2": 130.9, "r_x3": 278.3, "r_y3": 130.9, "coord_origin": "TOPLEFT" }, "text": ",", "orig": ",", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 10, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 284.9, "r_y0": 139.7, "r_x1": 312.8, "r_y1": 139.7, "r_x2": 312.8, "r_y2": 130.9, "r_x3": 284.9, "r_y3": 130.9, "coord_origin": "TOPLEFT" }, "text": "", "orig": "", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 11, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 312.8, "r_y0": 139.7, "r_x1": 315.6, "r_y1": 139.7, "r_x2": 315.6, "r_y2": 130.9, "r_x3": 312.8, "r_y3": 130.9, "coord_origin": "TOPLEFT" }, "text": ",", "orig": ",", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 12, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 319.5, "r_y0": 139.7, "r_x1": 343.1, "r_y1": 139.7, "r_x2": 343.1, "r_y2": 130.9, "r_x3": 319.5, "r_y3": 130.9, "coord_origin": "TOPLEFT" }, "text": "", "orig": "", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 13, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 347.1, "r_y0": 139.7, "r_x1": 363.2, "r_y1": 139.7, "r_x2": 363.2, "r_y2": 130.9, "r_x3": 347.1, "r_y3": 130.9, "coord_origin": "TOPLEFT" }, "text": "and", "orig": "and", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 14, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 367.1, "r_y0": 139.7, "r_x1": 395.8, "r_y1": 139.7, "r_x2": 395.8, "r_y2": 130.9, "r_x3": 367.1, "r_y3": 130.9, "coord_origin": "TOPLEFT" }, "text": "", "orig": "", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 15, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 395.8, "r_y0": 139.7, "r_x1": 480.6, "r_y1": 139.7, "r_x2": 480.6, "r_y2": 130.9, "r_x3": 395.8, "r_y3": 130.9, "coord_origin": "TOPLEFT" }, "text": ", one can construct", "orig": ", one can construct", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 16, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 134.8, "r_y0": 151.6, "r_x1": 480.6, "r_y1": 151.6, "r_x2": 480.6, "r_y2": 142.8, "r_x3": 134.8, "r_y3": 142.8, "coord_origin": "TOPLEFT" }, "text": "simple table structures without any spanning cells. In reality though, one needs", "orig": "simple table structures without any spanning cells. In reality though, one needs", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 17, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 134.8, "r_y0": 163.6, "r_x1": 480.6, "r_y1": 163.6, "r_x2": 480.6, "r_y2": 154.8, "r_x3": 134.8, "r_y3": 154.8, "coord_origin": "TOPLEFT" }, "text": "at least 28 HTML tokens to describe the most common complex tables observed", "orig": "at least 28 HTML tokens to describe the most common complex tables observed", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 18, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 134.8, "r_y0": 175.6, "r_x1": 480.6, "r_y1": 175.6, "r_x2": 480.6, "r_y2": 166.8, "r_x3": 134.8, "r_y3": 166.8, "coord_origin": "TOPLEFT" }, "text": "in real-world documents [21,22], due to a variety of spanning cells definitions in", "orig": "in real-world documents [21,22], due to a variety of spanning cells definitions in", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 19, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 134.8, "r_y0": 187.5, "r_x1": 261.9, "r_y1": 187.5, "r_x2": 261.9, "r_y2": 178.7, "r_x3": 134.8, "r_y3": 178.7, "coord_origin": "TOPLEFT" }, "text": "the HTML token vocabulary.", "orig": "the HTML token vocabulary.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, "text": "ulary and can be interpreted as a table structure. For example, with the HTML tokens ,
, , , and , one can construct simple table structures without any spanning cells. In reality though, one needs at least 28 HTML tokens to describe the most common complex tables observed in real-world documents [21,22], due to a variety of spanning cells definitions in the HTML token vocabulary." }, { "label": "caption", "id": 7, "page_no": 4, "cluster": { "id": 7, "label": "caption", "bbox": { "l": 145.6, "t": 221.1, "r": 469.8, "b": 229.2, "coord_origin": "TOPLEFT" }, "confidence": 0.85, "cells": [ { "index": 20, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 145.6, "r_y0": 229.0, "r_x1": 173.5, "r_y1": 229.0, "r_x2": 173.5, "r_y2": 221.1, "r_x3": 145.6, "r_y3": 221.1, "coord_origin": "TOPLEFT" }, "text": "Fig. 2.", "orig": "Fig. 2.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 21, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 176.6, "r_y0": 229.2, "r_x1": 469.8, "r_y1": 229.2, "r_x2": 469.8, "r_y2": 221.1, "r_x3": 176.6, "r_y3": 221.1, "coord_origin": "TOPLEFT" }, "text": "Frequency of tokens in HTML and OTSL as they appear in PubTabNet.", "orig": "Frequency of tokens in HTML and OTSL as they appear in PubTabNet.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, "text": "Fig. 2. Frequency of tokens in HTML and OTSL as they appear in PubTabNet." }, { "label": "text", "id": 1, "page_no": 4, "cluster": { "id": 1, "label": "text", "bbox": { "l": 134.8, "t": 368.2, "r": 480.6, "b": 532.4, "coord_origin": "TOPLEFT" }, "confidence": 0.98, "cells": [ { "index": 22, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 149.7, "r_y0": 377.0, "r_x1": 480.6, "r_y1": 377.0, "r_x2": 480.6, "r_y2": 368.2, "r_x3": 149.7, "r_y3": 368.2, "coord_origin": "TOPLEFT" }, "text": "Obviously, HTML and other general-purpose markup languages were not de-", "orig": "Obviously, HTML and other general-purpose markup languages were not de-", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 23, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 134.8, "r_y0": 389.0, "r_x1": 480.6, "r_y1": 389.0, "r_x2": 480.6, "r_y2": 380.2, "r_x3": 134.8, "r_y3": 380.2, "coord_origin": "TOPLEFT" }, "text": "signed for Im2Seq models. As such, they have some serious drawbacks. First, the", "orig": "signed for Im2Seq models. As such, they have some serious drawbacks. First, the", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 24, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 134.8, "r_y0": 400.9, "r_x1": 480.6, "r_y1": 400.9, "r_x2": 480.6, "r_y2": 392.1, "r_x3": 134.8, "r_y3": 392.1, "coord_origin": "TOPLEFT" }, "text": "token vocabulary needs to be artificially large in order to describe all plausible", "orig": "token vocabulary needs to be artificially large in order to describe all plausible", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 25, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 134.8, "r_y0": 412.9, "r_x1": 480.6, "r_y1": 412.9, "r_x2": 480.6, "r_y2": 404.1, "r_x3": 134.8, "r_y3": 404.1, "coord_origin": "TOPLEFT" }, "text": "tabular structures. Since most Im2Seq models use an autoregressive approach,", "orig": "tabular structures. Since most Im2Seq models use an autoregressive approach,", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 26, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 134.8, "r_y0": 424.8, "r_x1": 480.6, "r_y1": 424.8, "r_x2": 480.6, "r_y2": 416.0, "r_x3": 134.8, "r_y3": 416.0, "coord_origin": "TOPLEFT" }, "text": "they generate the sequence token by token. Therefore, to reduce inference time,", "orig": "they generate the sequence token by token. Therefore, to reduce inference time,", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 27, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 134.8, "r_y0": 436.8, "r_x1": 480.6, "r_y1": 436.8, "r_x2": 480.6, "r_y2": 428.0, "r_x3": 134.8, "r_y3": 428.0, "coord_origin": "TOPLEFT" }, "text": "a shorter sequence length is critical. Every table-cell is represented by at least", "orig": "a shorter sequence length is critical. Every table-cell is represented by at least", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 28, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 134.8, "r_y0": 448.7, "r_x1": 187.9, "r_y1": 448.7, "r_x2": 187.9, "r_y2": 439.9, "r_x3": 134.8, "r_y3": 439.9, "coord_origin": "TOPLEFT" }, "text": "two tokens (", "orig": "two tokens (", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 29, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 187.9, "r_y0": 448.7, "r_x1": 211.6, "r_y1": 448.7, "r_x2": 211.6, "r_y2": 439.9, "r_x3": 187.9, "r_y3": 439.9, "coord_origin": "TOPLEFT" }, "text": "", "orig": "", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 30, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 214.8, "r_y0": 448.7, "r_x1": 230.8, "r_y1": 448.7, "r_x2": 230.8, "r_y2": 439.9, "r_x3": 214.8, "r_y3": 439.9, "coord_origin": "TOPLEFT" }, "text": "and", "orig": "and", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 31, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 233.8, "r_y0": 448.7, "r_x1": 262.6, "r_y1": 448.7, "r_x2": 262.6, "r_y2": 439.9, "r_x3": 233.8, "r_y3": 439.9, "coord_origin": "TOPLEFT" }, "text": "", "orig": "", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 32, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 262.7, "r_y0": 448.7, "r_x1": 480.6, "r_y1": 448.7, "r_x2": 480.6, "r_y2": 439.9, "r_x3": 262.7, "r_y3": 439.9, "coord_origin": "TOPLEFT" }, "text": "). Furthermore, when tokenizing the HTML struc-", "orig": "). Furthermore, when tokenizing the HTML struc-", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 33, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 134.8, "r_y0": 460.7, "r_x1": 480.6, "r_y1": 460.7, "r_x2": 480.6, "r_y2": 451.9, "r_x3": 134.8, "r_y3": 451.9, "coord_origin": "TOPLEFT" }, "text": "ture, one needs to explicitly enumerate possible column-spans and row-spans", "orig": "ture, one needs to explicitly enumerate possible column-spans and row-spans", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 34, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 134.8, "r_y0": 472.6, "r_x1": 480.6, "r_y1": 472.6, "r_x2": 480.6, "r_y2": 463.8, "r_x3": 134.8, "r_y3": 463.8, "coord_origin": "TOPLEFT" }, "text": "as words. In practice, this ends up requiring 28 different HTML tokens (when", "orig": "as words. In practice, this ends up requiring 28 different HTML tokens (when", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 35, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 134.8, "r_y0": 484.6, "r_x1": 480.6, "r_y1": 484.6, "r_x2": 480.6, "r_y2": 475.8, "r_x3": 134.8, "r_y3": 475.8, "coord_origin": "TOPLEFT" }, "text": "including column- and row-spans up to 10 cells) just to describe every table in", "orig": "including column- and row-spans up to 10 cells) just to describe every table in", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 36, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 134.8, "r_y0": 496.6, "r_x1": 480.6, "r_y1": 496.6, "r_x2": 480.6, "r_y2": 487.8, "r_x3": 134.8, "r_y3": 487.8, "coord_origin": "TOPLEFT" }, "text": "the PubTabNet dataset. Clearly, not every token is equally represented, as is", "orig": "the PubTabNet dataset. Clearly, not every token is equally represented, as is", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 37, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 134.8, "r_y0": 508.5, "r_x1": 480.6, "r_y1": 508.5, "r_x2": 480.6, "r_y2": 499.7, "r_x3": 134.8, "r_y3": 499.7, "coord_origin": "TOPLEFT" }, "text": "depicted in Figure 2. This skewed distribution of tokens in combination with", "orig": "depicted in Figure 2. This skewed distribution of tokens in combination with", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 38, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 134.8, "r_y0": 520.5, "r_x1": 480.6, "r_y1": 520.5, "r_x2": 480.6, "r_y2": 511.7, "r_x3": 134.8, "r_y3": 511.7, "coord_origin": "TOPLEFT" }, "text": "variable token row-length makes it challenging for models to learn the HTML", "orig": "variable token row-length makes it challenging for models to learn the HTML", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 39, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 134.8, "r_y0": 532.4, "r_x1": 176.9, "r_y1": 532.4, "r_x2": 176.9, "r_y2": 523.6, "r_x3": 134.8, "r_y3": 523.6, "coord_origin": "TOPLEFT" }, "text": "structure.", "orig": "structure.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, "text": "Obviously, HTML and other general-purpose markup languages were not designed for Im2Seq models. As such, they have some serious drawbacks. First, the token vocabulary needs to be artificially large in order to describe all plausible tabular structures. Since most Im2Seq models use an autoregressive approach, they generate the sequence token by token. Therefore, to reduce inference time, a shorter sequence length is critical. Every table-cell is represented by at least two tokens ( and ). Furthermore, when tokenizing the HTML structure, one needs to explicitly enumerate possible column-spans and row-spans as words. In practice, this ends up requiring 28 different HTML tokens (when including column- and row-spans up to 10 cells) just to describe every table in the PubTabNet dataset. Clearly, not every token is equally represented, as is depicted in Figure 2. This skewed distribution of tokens in combination with variable token row-length makes it challenging for models to learn the HTML structure." }, { "label": "text", "id": 3, "page_no": 4, "cluster": { "id": 3, "label": "text", "bbox": { "l": 134.8, "t": 536.0, "r": 480.6, "b": 580.7, "coord_origin": "TOPLEFT" }, "confidence": 0.98, "cells": [ { "index": 40, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 149.7, "r_y0": 544.8, "r_x1": 480.6, "r_y1": 544.8, "r_x2": 480.6, "r_y2": 536.0, "r_x3": 149.7, "r_y3": 536.0, "coord_origin": "TOPLEFT" }, "text": "Additionally, it would be desirable if the representation would easily allow", "orig": "Additionally, it would be desirable if the representation would easily allow", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 41, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 134.8, "r_y0": 556.8, "r_x1": 480.6, "r_y1": 556.8, "r_x2": 480.6, "r_y2": 548.0, "r_x3": 134.8, "r_y3": 548.0, "coord_origin": "TOPLEFT" }, "text": "an early detection of invalid sequences on-the-go, before the prediction of the", "orig": "an early detection of invalid sequences on-the-go, before the prediction of the", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 42, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 134.8, "r_y0": 568.7, "r_x1": 480.6, "r_y1": 568.7, "r_x2": 480.6, "r_y2": 560.0, "r_x3": 134.8, "r_y3": 560.0, "coord_origin": "TOPLEFT" }, "text": "entire table structure is completed. HTML is not well-suited for this purpose as", "orig": "entire table structure is completed. HTML is not well-suited for this purpose as", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 43, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 134.8, "r_y0": 580.7, "r_x1": 452.2, "r_y1": 580.7, "r_x2": 452.2, "r_y2": 571.9, "r_x3": 134.8, "r_y3": 571.9, "coord_origin": "TOPLEFT" }, "text": "the verification of incomplete sequences is non-trivial or even impossible.", "orig": "the verification of incomplete sequences is non-trivial or even impossible.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, "text": "Additionally, it would be desirable if the representation would easily allow an early detection of invalid sequences on-the-go, before the prediction of the entire table structure is completed. HTML is not well-suited for this purpose as the verification of incomplete sequences is non-trivial or even impossible." }, { "label": "text", "id": 2, "page_no": 4, "cluster": { "id": 2, "label": "text", "bbox": { "l": 134.8, "t": 584.3, "r": 480.6, "b": 664.9, "coord_origin": "TOPLEFT" }, "confidence": 0.98, "cells": [ { "index": 44, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 149.7, "r_y0": 593.1, "r_x1": 480.6, "r_y1": 593.1, "r_x2": 480.6, "r_y2": 584.3, "r_x3": 149.7, "r_y3": 584.3, "coord_origin": "TOPLEFT" }, "text": "In a valid HTML table, the token sequence must describe a 2D grid of table", "orig": "In a valid HTML table, the token sequence must describe a 2D grid of table", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 45, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 134.8, "r_y0": 605.1, "r_x1": 480.6, "r_y1": 605.1, "r_x2": 480.6, "r_y2": 596.3, "r_x3": 134.8, "r_y3": 596.3, "coord_origin": "TOPLEFT" }, "text": "cells, serialised in row-major ordering, where each row and each column have", "orig": "cells, serialised in row-major ordering, where each row and each column have", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 46, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 134.8, "r_y0": 617.0, "r_x1": 480.6, "r_y1": 617.0, "r_x2": 480.6, "r_y2": 608.2, "r_x3": 134.8, "r_y3": 608.2, "coord_origin": "TOPLEFT" }, "text": "the same length (while considering row- and column-spans). Furthermore, every", "orig": "the same length (while considering row- and column-spans). Furthermore, every", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 47, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 134.8, "r_y0": 629.0, "r_x1": 480.6, "r_y1": 629.0, "r_x2": 480.6, "r_y2": 620.2, "r_x3": 134.8, "r_y3": 620.2, "coord_origin": "TOPLEFT" }, "text": "opening tag in HTML needs to be matched by a closing tag in a correct hierar-", "orig": "opening tag in HTML needs to be matched by a closing tag in a correct hierar-", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 48, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 134.8, "r_y0": 640.9, "r_x1": 480.6, "r_y1": 640.9, "r_x2": 480.6, "r_y2": 632.1, "r_x3": 134.8, "r_y3": 632.1, "coord_origin": "TOPLEFT" }, "text": "chical manner. Since the number of tokens for each table row and column can", "orig": "chical manner. Since the number of tokens for each table row and column can", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 49, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 134.8, "r_y0": 652.9, "r_x1": 480.6, "r_y1": 652.9, "r_x2": 480.6, "r_y2": 644.1, "r_x3": 134.8, "r_y3": 644.1, "coord_origin": "TOPLEFT" }, "text": "vary significantly, especially for large tables with many row- and column-spans,", "orig": "vary significantly, especially for large tables with many row- and column-spans,", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 50, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 134.8, "r_y0": 664.9, "r_x1": 480.6, "r_y1": 664.9, "r_x2": 480.6, "r_y2": 656.1, "r_x3": 134.8, "r_y3": 656.1, "coord_origin": "TOPLEFT" }, "text": "it is complex to verify the consistency of predicted structures during sequence", "orig": "it is complex to verify the consistency of predicted structures during sequence", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, "text": "In a valid HTML table, the token sequence must describe a 2D grid of table cells, serialised in row-major ordering, where each row and each column have the same length (while considering row- and column-spans). Furthermore, every opening tag in HTML needs to be matched by a closing tag in a correct hierarchical manner. Since the number of tokens for each table row and column can vary significantly, especially for large tables with many row- and column-spans, it is complex to verify the consistency of predicted structures during sequence" }, { "label": "picture", "id": 4, "page_no": 4, "cluster": { "id": 4, "label": "picture", "bbox": { "l": 137.4, "t": 233.5, "r": 476.6, "b": 340.2, "coord_origin": "TOPLEFT" }, "confidence": 0.94, "cells": [], "children": [] }, "text": "", "annotations": [], "provenance": null, "predicted_class": null, "confidence": null } ], "body": [ { "label": "text", "id": 0, "page_no": 4, "cluster": { "id": 0, "label": "text", "bbox": { "l": 134.8, "t": 118.9, "r": 480.6, "b": 187.5, "coord_origin": "TOPLEFT" }, "confidence": 0.99, "cells": [ { "index": 2, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 134.8, "r_y0": 127.7, "r_x1": 480.6, "r_y1": 127.7, "r_x2": 480.6, "r_y2": 118.9, "r_x3": 134.8, "r_y3": 118.9, "coord_origin": "TOPLEFT" }, "text": "ulary and can be interpreted as a table structure. For example, with the HTML", "orig": "ulary and can be interpreted as a table structure. For example, with the HTML", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 3, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 134.8, "r_y0": 139.7, "r_x1": 162.5, "r_y1": 139.7, "r_x2": 162.5, "r_y2": 130.9, "r_x3": 134.8, "r_y3": 130.9, "coord_origin": "TOPLEFT" }, "text": "tokens", "orig": "tokens", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 4, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 166.4, "r_y0": 139.7, "r_x1": 201.7, "r_y1": 139.7, "r_x2": 201.7, "r_y2": 130.9, "r_x3": 166.4, "r_y3": 130.9, "coord_origin": "TOPLEFT" }, "text": "", "orig": "
", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 5, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 201.7, "r_y0": 139.7, "r_x1": 204.5, "r_y1": 139.7, "r_x2": 204.5, "r_y2": 130.9, "r_x3": 201.7, "r_y3": 130.9, "coord_origin": "TOPLEFT" }, "text": ",", "orig": ",", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 6, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 208.4, "r_y0": 139.7, "r_x1": 248.9, "r_y1": 139.7, "r_x2": 248.9, "r_y2": 130.9, "r_x3": 208.4, "r_y3": 130.9, "coord_origin": "TOPLEFT" }, "text": "
", "orig": "", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 7, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 248.9, "r_y0": 139.7, "r_x1": 251.6, "r_y1": 139.7, "r_x2": 251.6, "r_y2": 130.9, "r_x3": 248.9, "r_y3": 130.9, "coord_origin": "TOPLEFT" }, "text": ",", "orig": ",", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 8, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 255.5, "r_y0": 139.7, "r_x1": 278.3, "r_y1": 139.7, "r_x2": 278.3, "r_y2": 130.9, "r_x3": 255.5, "r_y3": 130.9, "coord_origin": "TOPLEFT" }, "text": "", "orig": "", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 9, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 278.3, "r_y0": 139.7, "r_x1": 281.1, "r_y1": 139.7, "r_x2": 281.1, "r_y2": 130.9, "r_x3": 278.3, "r_y3": 130.9, "coord_origin": "TOPLEFT" }, "text": ",", "orig": ",", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 10, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 284.9, "r_y0": 139.7, "r_x1": 312.8, "r_y1": 139.7, "r_x2": 312.8, "r_y2": 130.9, "r_x3": 284.9, "r_y3": 130.9, "coord_origin": "TOPLEFT" }, "text": "", "orig": "", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 11, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 312.8, "r_y0": 139.7, "r_x1": 315.6, "r_y1": 139.7, "r_x2": 315.6, "r_y2": 130.9, "r_x3": 312.8, "r_y3": 130.9, "coord_origin": "TOPLEFT" }, "text": ",", "orig": ",", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 12, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 319.5, "r_y0": 139.7, "r_x1": 343.1, "r_y1": 139.7, "r_x2": 343.1, "r_y2": 130.9, "r_x3": 319.5, "r_y3": 130.9, "coord_origin": "TOPLEFT" }, "text": "", "orig": "", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 13, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 347.1, "r_y0": 139.7, "r_x1": 363.2, "r_y1": 139.7, "r_x2": 363.2, "r_y2": 130.9, "r_x3": 347.1, "r_y3": 130.9, "coord_origin": "TOPLEFT" }, "text": "and", "orig": "and", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 14, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 367.1, "r_y0": 139.7, "r_x1": 395.8, "r_y1": 139.7, "r_x2": 395.8, "r_y2": 130.9, "r_x3": 367.1, "r_y3": 130.9, "coord_origin": "TOPLEFT" }, "text": "", "orig": "", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 15, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 395.8, "r_y0": 139.7, "r_x1": 480.6, "r_y1": 139.7, "r_x2": 480.6, "r_y2": 130.9, "r_x3": 395.8, "r_y3": 130.9, "coord_origin": "TOPLEFT" }, "text": ", one can construct", "orig": ", one can construct", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 16, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 134.8, "r_y0": 151.6, "r_x1": 480.6, "r_y1": 151.6, "r_x2": 480.6, "r_y2": 142.8, "r_x3": 134.8, "r_y3": 142.8, "coord_origin": "TOPLEFT" }, "text": "simple table structures without any spanning cells. In reality though, one needs", "orig": "simple table structures without any spanning cells. In reality though, one needs", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 17, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 134.8, "r_y0": 163.6, "r_x1": 480.6, "r_y1": 163.6, "r_x2": 480.6, "r_y2": 154.8, "r_x3": 134.8, "r_y3": 154.8, "coord_origin": "TOPLEFT" }, "text": "at least 28 HTML tokens to describe the most common complex tables observed", "orig": "at least 28 HTML tokens to describe the most common complex tables observed", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 18, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 134.8, "r_y0": 175.6, "r_x1": 480.6, "r_y1": 175.6, "r_x2": 480.6, "r_y2": 166.8, "r_x3": 134.8, "r_y3": 166.8, "coord_origin": "TOPLEFT" }, "text": "in real-world documents [21,22], due to a variety of spanning cells definitions in", "orig": "in real-world documents [21,22], due to a variety of spanning cells definitions in", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 19, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 134.8, "r_y0": 187.5, "r_x1": 261.9, "r_y1": 187.5, "r_x2": 261.9, "r_y2": 178.7, "r_x3": 134.8, "r_y3": 178.7, "coord_origin": "TOPLEFT" }, "text": "the HTML token vocabulary.", "orig": "the HTML token vocabulary.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, "text": "ulary and can be interpreted as a table structure. For example, with the HTML tokens ,
, , , and , one can construct simple table structures without any spanning cells. In reality though, one needs at least 28 HTML tokens to describe the most common complex tables observed in real-world documents [21,22], due to a variety of spanning cells definitions in the HTML token vocabulary." }, { "label": "caption", "id": 7, "page_no": 4, "cluster": { "id": 7, "label": "caption", "bbox": { "l": 145.6, "t": 221.1, "r": 469.8, "b": 229.2, "coord_origin": "TOPLEFT" }, "confidence": 0.85, "cells": [ { "index": 20, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 145.6, "r_y0": 229.0, "r_x1": 173.5, "r_y1": 229.0, "r_x2": 173.5, "r_y2": 221.1, "r_x3": 145.6, "r_y3": 221.1, "coord_origin": "TOPLEFT" }, "text": "Fig. 2.", "orig": "Fig. 2.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 21, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 176.6, "r_y0": 229.2, "r_x1": 469.8, "r_y1": 229.2, "r_x2": 469.8, "r_y2": 221.1, "r_x3": 176.6, "r_y3": 221.1, "coord_origin": "TOPLEFT" }, "text": "Frequency of tokens in HTML and OTSL as they appear in PubTabNet.", "orig": "Frequency of tokens in HTML and OTSL as they appear in PubTabNet.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, "text": "Fig. 2. Frequency of tokens in HTML and OTSL as they appear in PubTabNet." }, { "label": "text", "id": 1, "page_no": 4, "cluster": { "id": 1, "label": "text", "bbox": { "l": 134.8, "t": 368.2, "r": 480.6, "b": 532.4, "coord_origin": "TOPLEFT" }, "confidence": 0.98, "cells": [ { "index": 22, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 149.7, "r_y0": 377.0, "r_x1": 480.6, "r_y1": 377.0, "r_x2": 480.6, "r_y2": 368.2, "r_x3": 149.7, "r_y3": 368.2, "coord_origin": "TOPLEFT" }, "text": "Obviously, HTML and other general-purpose markup languages were not de-", "orig": "Obviously, HTML and other general-purpose markup languages were not de-", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 23, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 134.8, "r_y0": 389.0, "r_x1": 480.6, "r_y1": 389.0, "r_x2": 480.6, "r_y2": 380.2, "r_x3": 134.8, "r_y3": 380.2, "coord_origin": "TOPLEFT" }, "text": "signed for Im2Seq models. As such, they have some serious drawbacks. First, the", "orig": "signed for Im2Seq models. As such, they have some serious drawbacks. First, the", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 24, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 134.8, "r_y0": 400.9, "r_x1": 480.6, "r_y1": 400.9, "r_x2": 480.6, "r_y2": 392.1, "r_x3": 134.8, "r_y3": 392.1, "coord_origin": "TOPLEFT" }, "text": "token vocabulary needs to be artificially large in order to describe all plausible", "orig": "token vocabulary needs to be artificially large in order to describe all plausible", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 25, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 134.8, "r_y0": 412.9, "r_x1": 480.6, "r_y1": 412.9, "r_x2": 480.6, "r_y2": 404.1, "r_x3": 134.8, "r_y3": 404.1, "coord_origin": "TOPLEFT" }, "text": "tabular structures. Since most Im2Seq models use an autoregressive approach,", "orig": "tabular structures. Since most Im2Seq models use an autoregressive approach,", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 26, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 134.8, "r_y0": 424.8, "r_x1": 480.6, "r_y1": 424.8, "r_x2": 480.6, "r_y2": 416.0, "r_x3": 134.8, "r_y3": 416.0, "coord_origin": "TOPLEFT" }, "text": "they generate the sequence token by token. Therefore, to reduce inference time,", "orig": "they generate the sequence token by token. Therefore, to reduce inference time,", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 27, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 134.8, "r_y0": 436.8, "r_x1": 480.6, "r_y1": 436.8, "r_x2": 480.6, "r_y2": 428.0, "r_x3": 134.8, "r_y3": 428.0, "coord_origin": "TOPLEFT" }, "text": "a shorter sequence length is critical. Every table-cell is represented by at least", "orig": "a shorter sequence length is critical. Every table-cell is represented by at least", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 28, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 134.8, "r_y0": 448.7, "r_x1": 187.9, "r_y1": 448.7, "r_x2": 187.9, "r_y2": 439.9, "r_x3": 134.8, "r_y3": 439.9, "coord_origin": "TOPLEFT" }, "text": "two tokens (", "orig": "two tokens (", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 29, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 187.9, "r_y0": 448.7, "r_x1": 211.6, "r_y1": 448.7, "r_x2": 211.6, "r_y2": 439.9, "r_x3": 187.9, "r_y3": 439.9, "coord_origin": "TOPLEFT" }, "text": "", "orig": "", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 30, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 214.8, "r_y0": 448.7, "r_x1": 230.8, "r_y1": 448.7, "r_x2": 230.8, "r_y2": 439.9, "r_x3": 214.8, "r_y3": 439.9, "coord_origin": "TOPLEFT" }, "text": "and", "orig": "and", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 31, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 233.8, "r_y0": 448.7, "r_x1": 262.6, "r_y1": 448.7, "r_x2": 262.6, "r_y2": 439.9, "r_x3": 233.8, "r_y3": 439.9, "coord_origin": "TOPLEFT" }, "text": "", "orig": "", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 32, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 262.7, "r_y0": 448.7, "r_x1": 480.6, "r_y1": 448.7, "r_x2": 480.6, "r_y2": 439.9, "r_x3": 262.7, "r_y3": 439.9, "coord_origin": "TOPLEFT" }, "text": "). Furthermore, when tokenizing the HTML struc-", "orig": "). Furthermore, when tokenizing the HTML struc-", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 33, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 134.8, "r_y0": 460.7, "r_x1": 480.6, "r_y1": 460.7, "r_x2": 480.6, "r_y2": 451.9, "r_x3": 134.8, "r_y3": 451.9, "coord_origin": "TOPLEFT" }, "text": "ture, one needs to explicitly enumerate possible column-spans and row-spans", "orig": "ture, one needs to explicitly enumerate possible column-spans and row-spans", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 34, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 134.8, "r_y0": 472.6, "r_x1": 480.6, "r_y1": 472.6, "r_x2": 480.6, "r_y2": 463.8, "r_x3": 134.8, "r_y3": 463.8, "coord_origin": "TOPLEFT" }, "text": "as words. In practice, this ends up requiring 28 different HTML tokens (when", "orig": "as words. In practice, this ends up requiring 28 different HTML tokens (when", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 35, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 134.8, "r_y0": 484.6, "r_x1": 480.6, "r_y1": 484.6, "r_x2": 480.6, "r_y2": 475.8, "r_x3": 134.8, "r_y3": 475.8, "coord_origin": "TOPLEFT" }, "text": "including column- and row-spans up to 10 cells) just to describe every table in", "orig": "including column- and row-spans up to 10 cells) just to describe every table in", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 36, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 134.8, "r_y0": 496.6, "r_x1": 480.6, "r_y1": 496.6, "r_x2": 480.6, "r_y2": 487.8, "r_x3": 134.8, "r_y3": 487.8, "coord_origin": "TOPLEFT" }, "text": "the PubTabNet dataset. Clearly, not every token is equally represented, as is", "orig": "the PubTabNet dataset. Clearly, not every token is equally represented, as is", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 37, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 134.8, "r_y0": 508.5, "r_x1": 480.6, "r_y1": 508.5, "r_x2": 480.6, "r_y2": 499.7, "r_x3": 134.8, "r_y3": 499.7, "coord_origin": "TOPLEFT" }, "text": "depicted in Figure 2. This skewed distribution of tokens in combination with", "orig": "depicted in Figure 2. This skewed distribution of tokens in combination with", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 38, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 134.8, "r_y0": 520.5, "r_x1": 480.6, "r_y1": 520.5, "r_x2": 480.6, "r_y2": 511.7, "r_x3": 134.8, "r_y3": 511.7, "coord_origin": "TOPLEFT" }, "text": "variable token row-length makes it challenging for models to learn the HTML", "orig": "variable token row-length makes it challenging for models to learn the HTML", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 39, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 134.8, "r_y0": 532.4, "r_x1": 176.9, "r_y1": 532.4, "r_x2": 176.9, "r_y2": 523.6, "r_x3": 134.8, "r_y3": 523.6, "coord_origin": "TOPLEFT" }, "text": "structure.", "orig": "structure.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, "text": "Obviously, HTML and other general-purpose markup languages were not designed for Im2Seq models. As such, they have some serious drawbacks. First, the token vocabulary needs to be artificially large in order to describe all plausible tabular structures. Since most Im2Seq models use an autoregressive approach, they generate the sequence token by token. Therefore, to reduce inference time, a shorter sequence length is critical. Every table-cell is represented by at least two tokens ( and ). Furthermore, when tokenizing the HTML structure, one needs to explicitly enumerate possible column-spans and row-spans as words. In practice, this ends up requiring 28 different HTML tokens (when including column- and row-spans up to 10 cells) just to describe every table in the PubTabNet dataset. Clearly, not every token is equally represented, as is depicted in Figure 2. This skewed distribution of tokens in combination with variable token row-length makes it challenging for models to learn the HTML structure." }, { "label": "text", "id": 3, "page_no": 4, "cluster": { "id": 3, "label": "text", "bbox": { "l": 134.8, "t": 536.0, "r": 480.6, "b": 580.7, "coord_origin": "TOPLEFT" }, "confidence": 0.98, "cells": [ { "index": 40, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 149.7, "r_y0": 544.8, "r_x1": 480.6, "r_y1": 544.8, "r_x2": 480.6, "r_y2": 536.0, "r_x3": 149.7, "r_y3": 536.0, "coord_origin": "TOPLEFT" }, "text": "Additionally, it would be desirable if the representation would easily allow", "orig": "Additionally, it would be desirable if the representation would easily allow", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 41, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 134.8, "r_y0": 556.8, "r_x1": 480.6, "r_y1": 556.8, "r_x2": 480.6, "r_y2": 548.0, "r_x3": 134.8, "r_y3": 548.0, "coord_origin": "TOPLEFT" }, "text": "an early detection of invalid sequences on-the-go, before the prediction of the", "orig": "an early detection of invalid sequences on-the-go, before the prediction of the", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 42, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 134.8, "r_y0": 568.7, "r_x1": 480.6, "r_y1": 568.7, "r_x2": 480.6, "r_y2": 560.0, "r_x3": 134.8, "r_y3": 560.0, "coord_origin": "TOPLEFT" }, "text": "entire table structure is completed. HTML is not well-suited for this purpose as", "orig": "entire table structure is completed. HTML is not well-suited for this purpose as", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 43, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 134.8, "r_y0": 580.7, "r_x1": 452.2, "r_y1": 580.7, "r_x2": 452.2, "r_y2": 571.9, "r_x3": 134.8, "r_y3": 571.9, "coord_origin": "TOPLEFT" }, "text": "the verification of incomplete sequences is non-trivial or even impossible.", "orig": "the verification of incomplete sequences is non-trivial or even impossible.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, "text": "Additionally, it would be desirable if the representation would easily allow an early detection of invalid sequences on-the-go, before the prediction of the entire table structure is completed. HTML is not well-suited for this purpose as the verification of incomplete sequences is non-trivial or even impossible." }, { "label": "text", "id": 2, "page_no": 4, "cluster": { "id": 2, "label": "text", "bbox": { "l": 134.8, "t": 584.3, "r": 480.6, "b": 664.9, "coord_origin": "TOPLEFT" }, "confidence": 0.98, "cells": [ { "index": 44, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 149.7, "r_y0": 593.1, "r_x1": 480.6, "r_y1": 593.1, "r_x2": 480.6, "r_y2": 584.3, "r_x3": 149.7, "r_y3": 584.3, "coord_origin": "TOPLEFT" }, "text": "In a valid HTML table, the token sequence must describe a 2D grid of table", "orig": "In a valid HTML table, the token sequence must describe a 2D grid of table", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 45, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 134.8, "r_y0": 605.1, "r_x1": 480.6, "r_y1": 605.1, "r_x2": 480.6, "r_y2": 596.3, "r_x3": 134.8, "r_y3": 596.3, "coord_origin": "TOPLEFT" }, "text": "cells, serialised in row-major ordering, where each row and each column have", "orig": "cells, serialised in row-major ordering, where each row and each column have", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 46, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 134.8, "r_y0": 617.0, "r_x1": 480.6, "r_y1": 617.0, "r_x2": 480.6, "r_y2": 608.2, "r_x3": 134.8, "r_y3": 608.2, "coord_origin": "TOPLEFT" }, "text": "the same length (while considering row- and column-spans). Furthermore, every", "orig": "the same length (while considering row- and column-spans). Furthermore, every", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 47, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 134.8, "r_y0": 629.0, "r_x1": 480.6, "r_y1": 629.0, "r_x2": 480.6, "r_y2": 620.2, "r_x3": 134.8, "r_y3": 620.2, "coord_origin": "TOPLEFT" }, "text": "opening tag in HTML needs to be matched by a closing tag in a correct hierar-", "orig": "opening tag in HTML needs to be matched by a closing tag in a correct hierar-", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 48, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 134.8, "r_y0": 640.9, "r_x1": 480.6, "r_y1": 640.9, "r_x2": 480.6, "r_y2": 632.1, "r_x3": 134.8, "r_y3": 632.1, "coord_origin": "TOPLEFT" }, "text": "chical manner. Since the number of tokens for each table row and column can", "orig": "chical manner. Since the number of tokens for each table row and column can", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 49, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 134.8, "r_y0": 652.9, "r_x1": 480.6, "r_y1": 652.9, "r_x2": 480.6, "r_y2": 644.1, "r_x3": 134.8, "r_y3": 644.1, "coord_origin": "TOPLEFT" }, "text": "vary significantly, especially for large tables with many row- and column-spans,", "orig": "vary significantly, especially for large tables with many row- and column-spans,", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 50, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 134.8, "r_y0": 664.9, "r_x1": 480.6, "r_y1": 664.9, "r_x2": 480.6, "r_y2": 656.1, "r_x3": 134.8, "r_y3": 656.1, "coord_origin": "TOPLEFT" }, "text": "it is complex to verify the consistency of predicted structures during sequence", "orig": "it is complex to verify the consistency of predicted structures during sequence", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, "text": "In a valid HTML table, the token sequence must describe a 2D grid of table cells, serialised in row-major ordering, where each row and each column have the same length (while considering row- and column-spans). Furthermore, every opening tag in HTML needs to be matched by a closing tag in a correct hierarchical manner. Since the number of tokens for each table row and column can vary significantly, especially for large tables with many row- and column-spans, it is complex to verify the consistency of predicted structures during sequence" }, { "label": "picture", "id": 4, "page_no": 4, "cluster": { "id": 4, "label": "picture", "bbox": { "l": 137.4, "t": 233.5, "r": 476.6, "b": 340.2, "coord_origin": "TOPLEFT" }, "confidence": 0.94, "cells": [], "children": [] }, "text": "", "annotations": [], "provenance": null, "predicted_class": null, "confidence": null } ], "headers": [ { "label": "page_header", "id": 5, "page_no": 4, "cluster": { "id": 5, "label": "page_header", "bbox": { "l": 194.5, "t": 93.8, "r": 447.5, "b": 101.8, "coord_origin": "TOPLEFT" }, "confidence": 0.93, "cells": [ { "index": 0, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 194.5, "r_y0": 101.8, "r_x1": 447.5, "r_y1": 101.8, "r_x2": 447.5, "r_y2": 93.8, "r_x3": 194.5, "r_y3": 93.8, "coord_origin": "TOPLEFT" }, "text": "Optimized Table Tokenization for Table Structure Recognition", "orig": "Optimized Table Tokenization for Table Structure Recognition", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, "text": "Optimized Table Tokenization for Table Structure Recognition" }, { "label": "page_header", "id": 6, "page_no": 4, "cluster": { "id": 6, "label": "page_header", "bbox": { "l": 476.0, "t": 93.8, "r": 480.6, "b": 101.8, "coord_origin": "TOPLEFT" }, "confidence": 0.87, "cells": [ { "index": 1, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 476.0, "r_y0": 101.8, "r_x1": 480.6, "r_y1": 101.8, "r_x2": 480.6, "r_y2": 93.8, "r_x3": 476.0, "r_y3": 93.8, "coord_origin": "TOPLEFT" }, "text": "5", "orig": "5", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, "text": "5" } ] } }, { "page_no": 5, "size": { "width": 612.0, "height": 792.0 }, "parsed_page": { "dimension": { "angle": 0.0, "rect": { "r_x0": 0.0, "r_y0": 0.0, "r_x1": 612.0, "r_y1": 0.0, "r_x2": 612.0, "r_y2": 792.0, "r_x3": 0.0, "r_y3": 792.0, "coord_origin": "BOTTOMLEFT" }, "boundary_type": "crop_box", "art_bbox": { "l": 0.0, "t": 792.0, "r": 612.0, "b": 0.0, "coord_origin": "BOTTOMLEFT" }, "bleed_bbox": { "l": 0.0, "t": 792.0, "r": 612.0, "b": 0.0, "coord_origin": "BOTTOMLEFT" }, "crop_bbox": { "l": 0.0, "t": 792.0, "r": 612.0, "b": 0.0, "coord_origin": "BOTTOMLEFT" }, "media_bbox": { "l": 0.0, "t": 792.0, "r": 612.0, "b": 0.0, "coord_origin": "BOTTOMLEFT" }, "trim_bbox": { "l": 0.0, "t": 792.0, "r": 612.0, "b": 0.0, "coord_origin": "BOTTOMLEFT" } }, "bitmap_resources": [], "char_cells": [], "word_cells": [], "textline_cells": [ { "index": 0, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 134.8, "r_y0": 101.8, "r_x1": 139.4, "r_y1": 101.8, "r_x2": 139.4, "r_y2": 93.8, "r_x3": 134.8, "r_y3": 93.8, "coord_origin": "TOPLEFT" }, "text": "6", "orig": "6", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 1, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 167.8, "r_y0": 101.8, "r_x1": 178.1, "r_y1": 101.8, "r_x2": 178.1, "r_y2": 93.8, "r_x3": 167.8, "r_y3": 93.8, "coord_origin": "TOPLEFT" }, "text": "M.", "orig": "M.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 2, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 182.4, "r_y0": 101.8, "r_x1": 231.7, "r_y1": 101.8, "r_x2": 231.7, "r_y2": 93.8, "r_x3": 182.4, "r_y3": 93.8, "coord_origin": "TOPLEFT" }, "text": "Lysak, et al.", "orig": "Lysak, et al.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 3, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 134.8, "r_y0": 127.7, "r_x1": 480.6, "r_y1": 127.7, "r_x2": 480.6, "r_y2": 118.9, "r_x3": 134.8, "r_y3": 118.9, "coord_origin": "TOPLEFT" }, "text": "generation. Implicitly, this also means that Im2Seq models need to learn these", "orig": "generation. Implicitly, this also means that Im2Seq models need to learn these", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 4, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 134.8, "r_y0": 139.7, "r_x1": 364.6, "r_y1": 139.7, "r_x2": 364.6, "r_y2": 130.9, "r_x3": 134.8, "r_y3": 130.9, "coord_origin": "TOPLEFT" }, "text": "complex syntax rules, simply to deliver valid output.", "orig": "complex syntax rules, simply to deliver valid output.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 5, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 149.7, "r_y0": 152.3, "r_x1": 480.6, "r_y1": 152.3, "r_x2": 480.6, "r_y2": 143.5, "r_x3": 149.7, "r_y3": 143.5, "coord_origin": "TOPLEFT" }, "text": "In practice, we observe two major issues with prediction quality when train-", "orig": "In practice, we observe two major issues with prediction quality when train-", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 6, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 134.8, "r_y0": 164.2, "r_x1": 480.6, "r_y1": 164.2, "r_x2": 480.6, "r_y2": 155.4, "r_x3": 134.8, "r_y3": 155.4, "coord_origin": "TOPLEFT" }, "text": "ing Im2Seq models on HTML table structure generation from images. On the", "orig": "ing Im2Seq models on HTML table structure generation from images. On the", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 7, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 134.8, "r_y0": 176.2, "r_x1": 480.6, "r_y1": 176.2, "r_x2": 480.6, "r_y2": 167.4, "r_x3": 134.8, "r_y3": 167.4, "coord_origin": "TOPLEFT" }, "text": "one hand, we find that on large tables, the visual attention of the model often", "orig": "one hand, we find that on large tables, the visual attention of the model often", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 8, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 134.8, "r_y0": 188.1, "r_x1": 480.6, "r_y1": 188.1, "r_x2": 480.6, "r_y2": 179.3, "r_x3": 134.8, "r_y3": 179.3, "coord_origin": "TOPLEFT" }, "text": "starts to drift and is not accurately moving forward cell by cell anymore. This", "orig": "starts to drift and is not accurately moving forward cell by cell anymore. This", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 9, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 134.8, "r_y0": 200.1, "r_x1": 314.3, "r_y1": 200.1, "r_x2": 314.3, "r_y2": 191.3, "r_x3": 134.8, "r_y3": 191.3, "coord_origin": "TOPLEFT" }, "text": "manifests itself in either in an increasing", "orig": "manifests itself in either in an increasing", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 10, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 318.1, "r_y0": 200.1, "r_x1": 374.1, "r_y1": 200.1, "r_x2": 374.1, "r_y2": 191.3, "r_x3": 318.1, "r_y3": 191.3, "coord_origin": "TOPLEFT" }, "text": "location drift", "orig": "location drift", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 11, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 378.8, "r_y0": 200.1, "r_x1": 480.6, "r_y1": 200.1, "r_x2": 480.6, "r_y2": 191.3, "r_x3": 378.8, "r_y3": 191.3, "coord_origin": "TOPLEFT" }, "text": "for proposed table-cells", "orig": "for proposed table-cells", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 12, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 134.8, "r_y0": 212.1, "r_x1": 480.6, "r_y1": 212.1, "r_x2": 480.6, "r_y2": 203.3, "r_x3": 134.8, "r_y3": 203.3, "coord_origin": "TOPLEFT" }, "text": "in later rows on the same column or even complete loss of vertical alignment, as", "orig": "in later rows on the same column or even complete loss of vertical alignment, as", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 13, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 134.8, "r_y0": 224.0, "r_x1": 480.6, "r_y1": 224.0, "r_x2": 480.6, "r_y2": 215.2, "r_x3": 134.8, "r_y3": 215.2, "coord_origin": "TOPLEFT" }, "text": "illustrated in Figure 5. Addressing this with post-processing is partially possible,", "orig": "illustrated in Figure 5. Addressing this with post-processing is partially possible,", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 14, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 134.8, "r_y0": 236.0, "r_x1": 480.6, "r_y1": 236.0, "r_x2": 480.6, "r_y2": 227.2, "r_x3": 134.8, "r_y3": 227.2, "coord_origin": "TOPLEFT" }, "text": "but clearly undesired. On the other hand, we find many instances of predictions", "orig": "but clearly undesired. On the other hand, we find many instances of predictions", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 15, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 134.8, "r_y0": 247.9, "r_x1": 480.6, "r_y1": 247.9, "r_x2": 480.6, "r_y2": 239.1, "r_x3": 134.8, "r_y3": 239.1, "coord_origin": "TOPLEFT" }, "text": "with structural inconsistencies or plain invalid HTML output, as shown in Fig-", "orig": "with structural inconsistencies or plain invalid HTML output, as shown in Fig-", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 16, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 134.8, "r_y0": 259.9, "r_x1": 480.6, "r_y1": 259.9, "r_x2": 480.6, "r_y2": 251.1, "r_x3": 134.8, "r_y3": 251.1, "coord_origin": "TOPLEFT" }, "text": "ure 6, which are nearly impossible to properly correct. Both problems seriously", "orig": "ure 6, which are nearly impossible to properly correct. Both problems seriously", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 17, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 134.8, "r_y0": 271.8, "r_x1": 480.6, "r_y1": 271.8, "r_x2": 480.6, "r_y2": 263.0, "r_x3": 134.8, "r_y3": 263.0, "coord_origin": "TOPLEFT" }, "text": "impact the TSR model performance, since they reflect not only in the task of", "orig": "impact the TSR model performance, since they reflect not only in the task of", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 18, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 134.8, "r_y0": 283.8, "r_x1": 480.6, "r_y1": 283.8, "r_x2": 480.6, "r_y2": 275.0, "r_x3": 134.8, "r_y3": 275.0, "coord_origin": "TOPLEFT" }, "text": "pure structure recognition but also in the equally crucial recognition or matching", "orig": "pure structure recognition but also in the equally crucial recognition or matching", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 19, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 134.8, "r_y0": 295.7, "r_x1": 223.6, "r_y1": 295.7, "r_x2": 223.6, "r_y2": 286.9, "r_x3": 134.8, "r_y3": 286.9, "coord_origin": "TOPLEFT" }, "text": "of table cell content.", "orig": "of table cell content.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 20, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 134.8, "r_y0": 331.2, "r_x1": 141.5, "r_y1": 331.2, "r_x2": 141.5, "r_y2": 320.6, "r_x3": 134.8, "r_y3": 320.6, "coord_origin": "TOPLEFT" }, "text": "4", "orig": "4", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 21, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 154.9, "r_y0": 331.2, "r_x1": 372.5, "r_y1": 331.2, "r_x2": 372.5, "r_y2": 320.6, "r_x3": 154.9, "r_y3": 320.6, "coord_origin": "TOPLEFT" }, "text": "Optimised Table Structure Language", "orig": "Optimised Table Structure Language", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 22, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 134.8, "r_y0": 357.9, "r_x1": 480.6, "r_y1": 357.9, "r_x2": 480.6, "r_y2": 349.1, "r_x3": 134.8, "r_y3": 349.1, "coord_origin": "TOPLEFT" }, "text": "To mitigate the issues with HTML in Im2Seq-based TSR models laid out before,", "orig": "To mitigate the issues with HTML in Im2Seq-based TSR models laid out before,", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 23, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 134.8, "r_y0": 369.9, "r_x1": 480.6, "r_y1": 369.9, "r_x2": 480.6, "r_y2": 361.1, "r_x3": 134.8, "r_y3": 361.1, "coord_origin": "TOPLEFT" }, "text": "we propose here our Optimised Table Structure Language (OTSL). OTSL is", "orig": "we propose here our Optimised Table Structure Language (OTSL). OTSL is", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 24, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 134.8, "r_y0": 381.8, "r_x1": 480.6, "r_y1": 381.8, "r_x2": 480.6, "r_y2": 373.0, "r_x3": 134.8, "r_y3": 373.0, "coord_origin": "TOPLEFT" }, "text": "designed to express table structure with a minimized vocabulary and a simple", "orig": "designed to express table structure with a minimized vocabulary and a simple", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 25, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 134.8, "r_y0": 393.8, "r_x1": 480.6, "r_y1": 393.8, "r_x2": 480.6, "r_y2": 385.0, "r_x3": 134.8, "r_y3": 385.0, "coord_origin": "TOPLEFT" }, "text": "set of rules, which are both significantly reduced compared to HTML. At the", "orig": "set of rules, which are both significantly reduced compared to HTML. At the", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 26, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 134.8, "r_y0": 405.7, "r_x1": 480.6, "r_y1": 405.7, "r_x2": 480.6, "r_y2": 396.9, "r_x3": 134.8, "r_y3": 396.9, "coord_origin": "TOPLEFT" }, "text": "same time, OTSL enables easy error detection and correction during sequence", "orig": "same time, OTSL enables easy error detection and correction during sequence", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 27, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 134.8, "r_y0": 417.7, "r_x1": 480.6, "r_y1": 417.7, "r_x2": 480.6, "r_y2": 408.9, "r_x3": 134.8, "r_y3": 408.9, "coord_origin": "TOPLEFT" }, "text": "generation. We further demonstrate how the compact structure representation", "orig": "generation. We further demonstrate how the compact structure representation", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 28, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 134.8, "r_y0": 429.6, "r_x1": 480.6, "r_y1": 429.6, "r_x2": 480.6, "r_y2": 420.8, "r_x3": 134.8, "r_y3": 420.8, "coord_origin": "TOPLEFT" }, "text": "and minimized sequence length improves prediction accuracy and inference time", "orig": "and minimized sequence length improves prediction accuracy and inference time", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 29, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 134.8, "r_y0": 441.6, "r_x1": 276.7, "r_y1": 441.6, "r_x2": 276.7, "r_y2": 432.8, "r_x3": 134.8, "r_y3": 432.8, "coord_origin": "TOPLEFT" }, "text": "in the TableFormer architecture.", "orig": "in the TableFormer architecture.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 30, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 134.8, "r_y0": 474.7, "r_x1": 149.4, "r_y1": 474.7, "r_x2": 149.4, "r_y2": 465.9, "r_x3": 134.8, "r_y3": 465.9, "coord_origin": "TOPLEFT" }, "text": "4.1", "orig": "4.1", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 31, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 160.9, "r_y0": 474.7, "r_x1": 261.8, "r_y1": 474.7, "r_x2": 261.8, "r_y2": 465.9, "r_x3": 160.9, "r_y3": 465.9, "coord_origin": "TOPLEFT" }, "text": "Language Definition", "orig": "Language Definition", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 32, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 134.8, "r_y0": 497.8, "r_x1": 480.6, "r_y1": 497.8, "r_x2": 480.6, "r_y2": 489.0, "r_x3": 134.8, "r_y3": 489.0, "coord_origin": "TOPLEFT" }, "text": "In Figure 3, we illustrate how the OTSL is defined. In essence, the OTSL defines", "orig": "In Figure 3, we illustrate how the OTSL is defined. In essence, the OTSL defines", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 33, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 134.8, "r_y0": 509.7, "r_x1": 480.6, "r_y1": 509.7, "r_x2": 480.6, "r_y2": 501.0, "r_x3": 134.8, "r_y3": 501.0, "coord_origin": "TOPLEFT" }, "text": "only 5 tokens that directly describe a tabular structure based on an atomic 2D", "orig": "only 5 tokens that directly describe a tabular structure based on an atomic 2D", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 34, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 134.8, "r_y0": 521.7, "r_x1": 154.7, "r_y1": 521.7, "r_x2": 154.7, "r_y2": 512.9, "r_x3": 134.8, "r_y3": 512.9, "coord_origin": "TOPLEFT" }, "text": "grid.", "orig": "grid.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 35, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 149.7, "r_y0": 534.3, "r_x1": 409.3, "r_y1": 534.3, "r_x2": 409.3, "r_y2": 525.5, "r_x3": 149.7, "r_y3": 525.5, "coord_origin": "TOPLEFT" }, "text": "The OTSL vocabulary is comprised of the following tokens:", "orig": "The OTSL vocabulary is comprised of the following tokens:", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 36, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 141.0, "r_y0": 556.8, "r_x1": 146.7, "r_y1": 556.8, "r_x2": 146.7, "r_y2": 548.0, "r_x3": 141.0, "r_y3": 548.0, "coord_origin": "TOPLEFT" }, "text": "-", "orig": "-", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 37, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 151.7, "r_y0": 556.8, "r_x1": 193.2, "r_y1": 556.8, "r_x2": 193.2, "r_y2": 548.0, "r_x3": 151.7, "r_y3": 548.0, "coord_origin": "TOPLEFT" }, "text": "\"C\" cell -", "orig": "\"C\" cell -", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 38, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 196.5, "r_y0": 556.8, "r_x1": 263.5, "r_y1": 556.8, "r_x2": 263.5, "r_y2": 548.0, "r_x3": 196.5, "r_y3": 548.0, "coord_origin": "TOPLEFT" }, "text": "a new table cell", "orig": "a new table cell", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 39, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 267.8, "r_y0": 556.8, "r_x1": 460.5, "r_y1": 556.8, "r_x2": 460.5, "r_y2": 548.0, "r_x3": 267.8, "r_y3": 548.0, "coord_origin": "TOPLEFT" }, "text": "that either has or does not have cell content", "orig": "that either has or does not have cell content", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 40, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 141.0, "r_y0": 569.4, "r_x1": 146.7, "r_y1": 569.4, "r_x2": 146.7, "r_y2": 560.6, "r_x3": 141.0, "r_y3": 560.6, "coord_origin": "TOPLEFT" }, "text": "-", "orig": "-", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 41, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 151.7, "r_y0": 569.4, "r_x1": 194.3, "r_y1": 569.4, "r_x2": 194.3, "r_y2": 560.6, "r_x3": 151.7, "r_y3": 560.6, "coord_origin": "TOPLEFT" }, "text": "\"L\" cell -", "orig": "\"L\" cell -", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 42, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 198.7, "r_y0": 569.4, "r_x1": 264.5, "r_y1": 569.4, "r_x2": 264.5, "r_y2": 560.6, "r_x3": 198.7, "r_y3": 560.6, "coord_origin": "TOPLEFT" }, "text": "left-looking cell", "orig": "left-looking cell", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 43, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 264.5, "r_y0": 569.4, "r_x1": 480.6, "r_y1": 569.4, "r_x2": 480.6, "r_y2": 560.6, "r_x3": 264.5, "r_y3": 560.6, "coord_origin": "TOPLEFT" }, "text": ", merging with the left neighbor cell to create a", "orig": ", merging with the left neighbor cell to create a", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 44, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 151.7, "r_y0": 581.3, "r_x1": 171.7, "r_y1": 581.3, "r_x2": 171.7, "r_y2": 572.5, "r_x3": 151.7, "r_y3": 572.5, "coord_origin": "TOPLEFT" }, "text": "span", "orig": "span", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 45, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 141.0, "r_y0": 593.9, "r_x1": 146.7, "r_y1": 593.9, "r_x2": 146.7, "r_y2": 585.1, "r_x3": 141.0, "r_y3": 585.1, "coord_origin": "TOPLEFT" }, "text": "-", "orig": "-", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 46, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 151.7, "r_y0": 593.9, "r_x1": 194.1, "r_y1": 593.9, "r_x2": 194.1, "r_y2": 585.1, "r_x3": 151.7, "r_y3": 585.1, "coord_origin": "TOPLEFT" }, "text": "\"U\" cell -", "orig": "\"U\" cell -", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 47, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 197.7, "r_y0": 593.9, "r_x1": 259.9, "r_y1": 593.9, "r_x2": 259.9, "r_y2": 585.1, "r_x3": 197.7, "r_y3": 585.1, "coord_origin": "TOPLEFT" }, "text": "up-looking cell", "orig": "up-looking cell", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 48, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 259.9, "r_y0": 593.9, "r_x1": 480.6, "r_y1": 593.9, "r_x2": 480.6, "r_y2": 585.1, "r_x3": 259.9, "r_y3": 585.1, "coord_origin": "TOPLEFT" }, "text": ", merging with the upper neighbor cell to create a", "orig": ", merging with the upper neighbor cell to create a", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 49, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 151.7, "r_y0": 605.9, "r_x1": 171.7, "r_y1": 605.9, "r_x2": 171.7, "r_y2": 597.1, "r_x3": 151.7, "r_y3": 597.1, "coord_origin": "TOPLEFT" }, "text": "span", "orig": "span", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 50, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 141.0, "r_y0": 618.5, "r_x1": 146.7, "r_y1": 618.5, "r_x2": 146.7, "r_y2": 609.7, "r_x3": 141.0, "r_y3": 609.7, "coord_origin": "TOPLEFT" }, "text": "-", "orig": "-", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 51, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 151.7, "r_y0": 618.5, "r_x1": 193.5, "r_y1": 618.5, "r_x2": 193.5, "r_y2": 609.7, "r_x3": 151.7, "r_y3": 609.7, "coord_origin": "TOPLEFT" }, "text": "\"X\" cell -", "orig": "\"X\" cell -", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 52, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 196.8, "r_y0": 618.5, "r_x1": 236.1, "r_y1": 618.5, "r_x2": 236.1, "r_y2": 609.7, "r_x3": 196.8, "r_y3": 609.7, "coord_origin": "TOPLEFT" }, "text": "cross cell", "orig": "cross cell", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 53, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 236.1, "r_y0": 618.5, "r_x1": 454.6, "r_y1": 618.5, "r_x2": 454.6, "r_y2": 609.7, "r_x3": 236.1, "r_y3": 609.7, "coord_origin": "TOPLEFT" }, "text": ", to merge with both left and upper neighbor cells", "orig": ", to merge with both left and upper neighbor cells", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 54, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 141.0, "r_y0": 631.1, "r_x1": 146.7, "r_y1": 631.1, "r_x2": 146.7, "r_y2": 622.3, "r_x3": 141.0, "r_y3": 622.3, "coord_origin": "TOPLEFT" }, "text": "-", "orig": "-", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 55, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 151.7, "r_y0": 631.1, "r_x1": 182.0, "r_y1": 631.1, "r_x2": 182.0, "r_y2": 622.3, "r_x3": 151.7, "r_y3": 622.3, "coord_origin": "TOPLEFT" }, "text": "\"NL\" -", "orig": "\"NL\" -", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 56, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 185.3, "r_y0": 631.1, "r_x1": 221.5, "r_y1": 631.1, "r_x2": 221.5, "r_y2": 622.3, "r_x3": 185.3, "r_y3": 622.3, "coord_origin": "TOPLEFT" }, "text": "new-line", "orig": "new-line", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 57, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 221.5, "r_y0": 631.1, "r_x1": 328.6, "r_y1": 631.1, "r_x2": 328.6, "r_y2": 622.3, "r_x3": 221.5, "r_y3": 622.3, "coord_origin": "TOPLEFT" }, "text": ", switch to the next row.", "orig": ", switch to the next row.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 58, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 149.7, "r_y0": 652.9, "r_x1": 480.6, "r_y1": 652.9, "r_x2": 480.6, "r_y2": 644.1, "r_x3": 149.7, "r_y3": 644.1, "coord_origin": "TOPLEFT" }, "text": "A notable attribute of OTSL is that it has the capability of achieving lossless", "orig": "A notable attribute of OTSL is that it has the capability of achieving lossless", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 59, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 134.8, "r_y0": 664.9, "r_x1": 228.2, "r_y1": 664.9, "r_x2": 228.2, "r_y2": 656.1, "r_x3": 134.8, "r_y3": 656.1, "coord_origin": "TOPLEFT" }, "text": "conversion to HTML.", "orig": "conversion to HTML.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "has_chars": false, "has_words": false, "has_lines": true, "image": null, "lines": [] }, "predictions": { "layout": { "clusters": [ { "id": 14, "label": "page_header", "bbox": { "l": 134.8, "t": 93.8, "r": 139.4, "b": 101.8, "coord_origin": "TOPLEFT" }, "confidence": 0.84, "cells": [ { "index": 0, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 134.8, "r_y0": 101.8, "r_x1": 139.4, "r_y1": 101.8, "r_x2": 139.4, "r_y2": 93.8, "r_x3": 134.8, "r_y3": 93.8, "coord_origin": "TOPLEFT" }, "text": "6", "orig": "6", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 11, "label": "page_header", "bbox": { "l": 167.8, "t": 93.8, "r": 231.7, "b": 101.8, "coord_origin": "TOPLEFT" }, "confidence": 0.89, "cells": [ { "index": 1, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 167.8, "r_y0": 101.8, "r_x1": 178.1, "r_y1": 101.8, "r_x2": 178.1, "r_y2": 93.8, "r_x3": 167.8, "r_y3": 93.8, "coord_origin": "TOPLEFT" }, "text": "M.", "orig": "M.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 2, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 182.4, "r_y0": 101.8, "r_x1": 231.7, "r_y1": 101.8, "r_x2": 231.7, "r_y2": 93.8, "r_x3": 182.4, "r_y3": 93.8, "coord_origin": "TOPLEFT" }, "text": "Lysak, et al.", "orig": "Lysak, et al.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 3, "label": "text", "bbox": { "l": 134.8, "t": 118.9, "r": 480.6, "b": 139.7, "coord_origin": "TOPLEFT" }, "confidence": 0.96, "cells": [ { "index": 3, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 134.8, "r_y0": 127.7, "r_x1": 480.6, "r_y1": 127.7, "r_x2": 480.6, "r_y2": 118.9, "r_x3": 134.8, "r_y3": 118.9, "coord_origin": "TOPLEFT" }, "text": "generation. Implicitly, this also means that Im2Seq models need to learn these", "orig": "generation. Implicitly, this also means that Im2Seq models need to learn these", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 4, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 134.8, "r_y0": 139.7, "r_x1": 364.6, "r_y1": 139.7, "r_x2": 364.6, "r_y2": 130.9, "r_x3": 134.8, "r_y3": 130.9, "coord_origin": "TOPLEFT" }, "text": "complex syntax rules, simply to deliver valid output.", "orig": "complex syntax rules, simply to deliver valid output.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 1, "label": "text", "bbox": { "l": 134.8, "t": 143.5, "r": 480.6, "b": 295.7, "coord_origin": "TOPLEFT" }, "confidence": 0.99, "cells": [ { "index": 5, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 149.7, "r_y0": 152.3, "r_x1": 480.6, "r_y1": 152.3, "r_x2": 480.6, "r_y2": 143.5, "r_x3": 149.7, "r_y3": 143.5, "coord_origin": "TOPLEFT" }, "text": "In practice, we observe two major issues with prediction quality when train-", "orig": "In practice, we observe two major issues with prediction quality when train-", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 6, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 134.8, "r_y0": 164.2, "r_x1": 480.6, "r_y1": 164.2, "r_x2": 480.6, "r_y2": 155.4, "r_x3": 134.8, "r_y3": 155.4, "coord_origin": "TOPLEFT" }, "text": "ing Im2Seq models on HTML table structure generation from images. On the", "orig": "ing Im2Seq models on HTML table structure generation from images. On the", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 7, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 134.8, "r_y0": 176.2, "r_x1": 480.6, "r_y1": 176.2, "r_x2": 480.6, "r_y2": 167.4, "r_x3": 134.8, "r_y3": 167.4, "coord_origin": "TOPLEFT" }, "text": "one hand, we find that on large tables, the visual attention of the model often", "orig": "one hand, we find that on large tables, the visual attention of the model often", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 8, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 134.8, "r_y0": 188.1, "r_x1": 480.6, "r_y1": 188.1, "r_x2": 480.6, "r_y2": 179.3, "r_x3": 134.8, "r_y3": 179.3, "coord_origin": "TOPLEFT" }, "text": "starts to drift and is not accurately moving forward cell by cell anymore. This", "orig": "starts to drift and is not accurately moving forward cell by cell anymore. This", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 9, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 134.8, "r_y0": 200.1, "r_x1": 314.3, "r_y1": 200.1, "r_x2": 314.3, "r_y2": 191.3, "r_x3": 134.8, "r_y3": 191.3, "coord_origin": "TOPLEFT" }, "text": "manifests itself in either in an increasing", "orig": "manifests itself in either in an increasing", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 10, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 318.1, "r_y0": 200.1, "r_x1": 374.1, "r_y1": 200.1, "r_x2": 374.1, "r_y2": 191.3, "r_x3": 318.1, "r_y3": 191.3, "coord_origin": "TOPLEFT" }, "text": "location drift", "orig": "location drift", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 11, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 378.8, "r_y0": 200.1, "r_x1": 480.6, "r_y1": 200.1, "r_x2": 480.6, "r_y2": 191.3, "r_x3": 378.8, "r_y3": 191.3, "coord_origin": "TOPLEFT" }, "text": "for proposed table-cells", "orig": "for proposed table-cells", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 12, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 134.8, "r_y0": 212.1, "r_x1": 480.6, "r_y1": 212.1, "r_x2": 480.6, "r_y2": 203.3, "r_x3": 134.8, "r_y3": 203.3, "coord_origin": "TOPLEFT" }, "text": "in later rows on the same column or even complete loss of vertical alignment, as", "orig": "in later rows on the same column or even complete loss of vertical alignment, as", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 13, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 134.8, "r_y0": 224.0, "r_x1": 480.6, "r_y1": 224.0, "r_x2": 480.6, "r_y2": 215.2, "r_x3": 134.8, "r_y3": 215.2, "coord_origin": "TOPLEFT" }, "text": "illustrated in Figure 5. Addressing this with post-processing is partially possible,", "orig": "illustrated in Figure 5. Addressing this with post-processing is partially possible,", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 14, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 134.8, "r_y0": 236.0, "r_x1": 480.6, "r_y1": 236.0, "r_x2": 480.6, "r_y2": 227.2, "r_x3": 134.8, "r_y3": 227.2, "coord_origin": "TOPLEFT" }, "text": "but clearly undesired. On the other hand, we find many instances of predictions", "orig": "but clearly undesired. On the other hand, we find many instances of predictions", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 15, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 134.8, "r_y0": 247.9, "r_x1": 480.6, "r_y1": 247.9, "r_x2": 480.6, "r_y2": 239.1, "r_x3": 134.8, "r_y3": 239.1, "coord_origin": "TOPLEFT" }, "text": "with structural inconsistencies or plain invalid HTML output, as shown in Fig-", "orig": "with structural inconsistencies or plain invalid HTML output, as shown in Fig-", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 16, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 134.8, "r_y0": 259.9, "r_x1": 480.6, "r_y1": 259.9, "r_x2": 480.6, "r_y2": 251.1, "r_x3": 134.8, "r_y3": 251.1, "coord_origin": "TOPLEFT" }, "text": "ure 6, which are nearly impossible to properly correct. Both problems seriously", "orig": "ure 6, which are nearly impossible to properly correct. Both problems seriously", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 17, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 134.8, "r_y0": 271.8, "r_x1": 480.6, "r_y1": 271.8, "r_x2": 480.6, "r_y2": 263.0, "r_x3": 134.8, "r_y3": 263.0, "coord_origin": "TOPLEFT" }, "text": "impact the TSR model performance, since they reflect not only in the task of", "orig": "impact the TSR model performance, since they reflect not only in the task of", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 18, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 134.8, "r_y0": 283.8, "r_x1": 480.6, "r_y1": 283.8, "r_x2": 480.6, "r_y2": 275.0, "r_x3": 134.8, "r_y3": 275.0, "coord_origin": "TOPLEFT" }, "text": "pure structure recognition but also in the equally crucial recognition or matching", "orig": "pure structure recognition but also in the equally crucial recognition or matching", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 19, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 134.8, "r_y0": 295.7, "r_x1": 223.6, "r_y1": 295.7, "r_x2": 223.6, "r_y2": 286.9, "r_x3": 134.8, "r_y3": 286.9, "coord_origin": "TOPLEFT" }, "text": "of table cell content.", "orig": "of table cell content.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 4, "label": "section_header", "bbox": { "l": 134.8, "t": 320.6, "r": 372.5, "b": 331.2, "coord_origin": "TOPLEFT" }, "confidence": 0.96, "cells": [ { "index": 20, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 134.8, "r_y0": 331.2, "r_x1": 141.5, "r_y1": 331.2, "r_x2": 141.5, "r_y2": 320.6, "r_x3": 134.8, "r_y3": 320.6, "coord_origin": "TOPLEFT" }, "text": "4", "orig": "4", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 21, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 154.9, "r_y0": 331.2, "r_x1": 372.5, "r_y1": 331.2, "r_x2": 372.5, "r_y2": 320.6, "r_x3": 154.9, "r_y3": 320.6, "coord_origin": "TOPLEFT" }, "text": "Optimised Table Structure Language", "orig": "Optimised Table Structure Language", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 0, "label": "text", "bbox": { "l": 134.8, "t": 349.1, "r": 480.6, "b": 441.6, "coord_origin": "TOPLEFT" }, "confidence": 0.99, "cells": [ { "index": 22, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 134.8, "r_y0": 357.9, "r_x1": 480.6, "r_y1": 357.9, "r_x2": 480.6, "r_y2": 349.1, "r_x3": 134.8, "r_y3": 349.1, "coord_origin": "TOPLEFT" }, "text": "To mitigate the issues with HTML in Im2Seq-based TSR models laid out before,", "orig": "To mitigate the issues with HTML in Im2Seq-based TSR models laid out before,", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 23, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 134.8, "r_y0": 369.9, "r_x1": 480.6, "r_y1": 369.9, "r_x2": 480.6, "r_y2": 361.1, "r_x3": 134.8, "r_y3": 361.1, "coord_origin": "TOPLEFT" }, "text": "we propose here our Optimised Table Structure Language (OTSL). OTSL is", "orig": "we propose here our Optimised Table Structure Language (OTSL). OTSL is", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 24, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 134.8, "r_y0": 381.8, "r_x1": 480.6, "r_y1": 381.8, "r_x2": 480.6, "r_y2": 373.0, "r_x3": 134.8, "r_y3": 373.0, "coord_origin": "TOPLEFT" }, "text": "designed to express table structure with a minimized vocabulary and a simple", "orig": "designed to express table structure with a minimized vocabulary and a simple", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 25, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 134.8, "r_y0": 393.8, "r_x1": 480.6, "r_y1": 393.8, "r_x2": 480.6, "r_y2": 385.0, "r_x3": 134.8, "r_y3": 385.0, "coord_origin": "TOPLEFT" }, "text": "set of rules, which are both significantly reduced compared to HTML. At the", "orig": "set of rules, which are both significantly reduced compared to HTML. At the", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 26, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 134.8, "r_y0": 405.7, "r_x1": 480.6, "r_y1": 405.7, "r_x2": 480.6, "r_y2": 396.9, "r_x3": 134.8, "r_y3": 396.9, "coord_origin": "TOPLEFT" }, "text": "same time, OTSL enables easy error detection and correction during sequence", "orig": "same time, OTSL enables easy error detection and correction during sequence", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 27, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 134.8, "r_y0": 417.7, "r_x1": 480.6, "r_y1": 417.7, "r_x2": 480.6, "r_y2": 408.9, "r_x3": 134.8, "r_y3": 408.9, "coord_origin": "TOPLEFT" }, "text": "generation. We further demonstrate how the compact structure representation", "orig": "generation. We further demonstrate how the compact structure representation", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 28, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 134.8, "r_y0": 429.6, "r_x1": 480.6, "r_y1": 429.6, "r_x2": 480.6, "r_y2": 420.8, "r_x3": 134.8, "r_y3": 420.8, "coord_origin": "TOPLEFT" }, "text": "and minimized sequence length improves prediction accuracy and inference time", "orig": "and minimized sequence length improves prediction accuracy and inference time", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 29, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 134.8, "r_y0": 441.6, "r_x1": 276.7, "r_y1": 441.6, "r_x2": 276.7, "r_y2": 432.8, "r_x3": 134.8, "r_y3": 432.8, "coord_origin": "TOPLEFT" }, "text": "in the TableFormer architecture.", "orig": "in the TableFormer architecture.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 5, "label": "section_header", "bbox": { "l": 134.8, "t": 465.9, "r": 261.8, "b": 474.7, "coord_origin": "TOPLEFT" }, "confidence": 0.96, "cells": [ { "index": 30, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 134.8, "r_y0": 474.7, "r_x1": 149.4, "r_y1": 474.7, "r_x2": 149.4, "r_y2": 465.9, "r_x3": 134.8, "r_y3": 465.9, "coord_origin": "TOPLEFT" }, "text": "4.1", "orig": "4.1", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 31, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 160.9, "r_y0": 474.7, "r_x1": 261.8, "r_y1": 474.7, "r_x2": 261.8, "r_y2": 465.9, "r_x3": 160.9, "r_y3": 465.9, "coord_origin": "TOPLEFT" }, "text": "Language Definition", "orig": "Language Definition", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 2, "label": "text", "bbox": { "l": 134.8, "t": 489.0, "r": 480.6, "b": 521.7, "coord_origin": "TOPLEFT" }, "confidence": 0.97, "cells": [ { "index": 32, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 134.8, "r_y0": 497.8, "r_x1": 480.6, "r_y1": 497.8, "r_x2": 480.6, "r_y2": 489.0, "r_x3": 134.8, "r_y3": 489.0, "coord_origin": "TOPLEFT" }, "text": "In Figure 3, we illustrate how the OTSL is defined. In essence, the OTSL defines", "orig": "In Figure 3, we illustrate how the OTSL is defined. In essence, the OTSL defines", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 33, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 134.8, "r_y0": 509.7, "r_x1": 480.6, "r_y1": 509.7, "r_x2": 480.6, "r_y2": 501.0, "r_x3": 134.8, "r_y3": 501.0, "coord_origin": "TOPLEFT" }, "text": "only 5 tokens that directly describe a tabular structure based on an atomic 2D", "orig": "only 5 tokens that directly describe a tabular structure based on an atomic 2D", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 34, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 134.8, "r_y0": 521.7, "r_x1": 154.7, "r_y1": 521.7, "r_x2": 154.7, "r_y2": 512.9, "r_x3": 134.8, "r_y3": 512.9, "coord_origin": "TOPLEFT" }, "text": "grid.", "orig": "grid.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 13, "label": "text", "bbox": { "l": 149.7, "t": 525.5, "r": 409.3, "b": 534.3, "coord_origin": "TOPLEFT" }, "confidence": 0.86, "cells": [ { "index": 35, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 149.7, "r_y0": 534.3, "r_x1": 409.3, "r_y1": 534.3, "r_x2": 409.3, "r_y2": 525.5, "r_x3": 149.7, "r_y3": 525.5, "coord_origin": "TOPLEFT" }, "text": "The OTSL vocabulary is comprised of the following tokens:", "orig": "The OTSL vocabulary is comprised of the following tokens:", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 9, "label": "list_item", "bbox": { "l": 141.0, "t": 548.0, "r": 460.5, "b": 556.8, "coord_origin": "TOPLEFT" }, "confidence": 0.92, "cells": [ { "index": 36, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 141.0, "r_y0": 556.8, "r_x1": 146.7, "r_y1": 556.8, "r_x2": 146.7, "r_y2": 548.0, "r_x3": 141.0, "r_y3": 548.0, "coord_origin": "TOPLEFT" }, "text": "-", "orig": "-", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 37, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 151.7, "r_y0": 556.8, "r_x1": 193.2, "r_y1": 556.8, "r_x2": 193.2, "r_y2": 548.0, "r_x3": 151.7, "r_y3": 548.0, "coord_origin": "TOPLEFT" }, "text": "\"C\" cell -", "orig": "\"C\" cell -", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 38, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 196.5, "r_y0": 556.8, "r_x1": 263.5, "r_y1": 556.8, "r_x2": 263.5, "r_y2": 548.0, "r_x3": 196.5, "r_y3": 548.0, "coord_origin": "TOPLEFT" }, "text": "a new table cell", "orig": "a new table cell", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 39, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 267.8, "r_y0": 556.8, "r_x1": 460.5, "r_y1": 556.8, "r_x2": 460.5, "r_y2": 548.0, "r_x3": 267.8, "r_y3": 548.0, "coord_origin": "TOPLEFT" }, "text": "that either has or does not have cell content", "orig": "that either has or does not have cell content", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 8, "label": "list_item", "bbox": { "l": 141.0, "t": 560.6, "r": 480.6, "b": 581.3, "coord_origin": "TOPLEFT" }, "confidence": 0.93, "cells": [ { "index": 40, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 141.0, "r_y0": 569.4, "r_x1": 146.7, "r_y1": 569.4, "r_x2": 146.7, "r_y2": 560.6, "r_x3": 141.0, "r_y3": 560.6, "coord_origin": "TOPLEFT" }, "text": "-", "orig": "-", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 41, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 151.7, "r_y0": 569.4, "r_x1": 194.3, "r_y1": 569.4, "r_x2": 194.3, "r_y2": 560.6, "r_x3": 151.7, "r_y3": 560.6, "coord_origin": "TOPLEFT" }, "text": "\"L\" cell -", "orig": "\"L\" cell -", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 42, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 198.7, "r_y0": 569.4, "r_x1": 264.5, "r_y1": 569.4, "r_x2": 264.5, "r_y2": 560.6, "r_x3": 198.7, "r_y3": 560.6, "coord_origin": "TOPLEFT" }, "text": "left-looking cell", "orig": "left-looking cell", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 43, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 264.5, "r_y0": 569.4, "r_x1": 480.6, "r_y1": 569.4, "r_x2": 480.6, "r_y2": 560.6, "r_x3": 264.5, "r_y3": 560.6, "coord_origin": "TOPLEFT" }, "text": ", merging with the left neighbor cell to create a", "orig": ", merging with the left neighbor cell to create a", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 44, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 151.7, "r_y0": 581.3, "r_x1": 171.7, "r_y1": 581.3, "r_x2": 171.7, "r_y2": 572.5, "r_x3": 151.7, "r_y3": 572.5, "coord_origin": "TOPLEFT" }, "text": "span", "orig": "span", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 7, "label": "list_item", "bbox": { "l": 141.0, "t": 585.1, "r": 480.6, "b": 605.9, "coord_origin": "TOPLEFT" }, "confidence": 0.94, "cells": [ { "index": 45, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 141.0, "r_y0": 593.9, "r_x1": 146.7, "r_y1": 593.9, "r_x2": 146.7, "r_y2": 585.1, "r_x3": 141.0, "r_y3": 585.1, "coord_origin": "TOPLEFT" }, "text": "-", "orig": "-", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 46, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 151.7, "r_y0": 593.9, "r_x1": 194.1, "r_y1": 593.9, "r_x2": 194.1, "r_y2": 585.1, "r_x3": 151.7, "r_y3": 585.1, "coord_origin": "TOPLEFT" }, "text": "\"U\" cell -", "orig": "\"U\" cell -", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 47, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 197.7, "r_y0": 593.9, "r_x1": 259.9, "r_y1": 593.9, "r_x2": 259.9, "r_y2": 585.1, "r_x3": 197.7, "r_y3": 585.1, "coord_origin": "TOPLEFT" }, "text": "up-looking cell", "orig": "up-looking cell", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 48, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 259.9, "r_y0": 593.9, "r_x1": 480.6, "r_y1": 593.9, "r_x2": 480.6, "r_y2": 585.1, "r_x3": 259.9, "r_y3": 585.1, "coord_origin": "TOPLEFT" }, "text": ", merging with the upper neighbor cell to create a", "orig": ", merging with the upper neighbor cell to create a", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 49, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 151.7, "r_y0": 605.9, "r_x1": 171.7, "r_y1": 605.9, "r_x2": 171.7, "r_y2": 597.1, "r_x3": 151.7, "r_y3": 597.1, "coord_origin": "TOPLEFT" }, "text": "span", "orig": "span", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 10, "label": "list_item", "bbox": { "l": 141.0, "t": 609.7, "r": 454.6, "b": 618.5, "coord_origin": "TOPLEFT" }, "confidence": 0.9, "cells": [ { "index": 50, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 141.0, "r_y0": 618.5, "r_x1": 146.7, "r_y1": 618.5, "r_x2": 146.7, "r_y2": 609.7, "r_x3": 141.0, "r_y3": 609.7, "coord_origin": "TOPLEFT" }, "text": "-", "orig": "-", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 51, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 151.7, "r_y0": 618.5, "r_x1": 193.5, "r_y1": 618.5, "r_x2": 193.5, "r_y2": 609.7, "r_x3": 151.7, "r_y3": 609.7, "coord_origin": "TOPLEFT" }, "text": "\"X\" cell -", "orig": "\"X\" cell -", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 52, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 196.8, "r_y0": 618.5, "r_x1": 236.1, "r_y1": 618.5, "r_x2": 236.1, "r_y2": 609.7, "r_x3": 196.8, "r_y3": 609.7, "coord_origin": "TOPLEFT" }, "text": "cross cell", "orig": "cross cell", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 53, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 236.1, "r_y0": 618.5, "r_x1": 454.6, "r_y1": 618.5, "r_x2": 454.6, "r_y2": 609.7, "r_x3": 236.1, "r_y3": 609.7, "coord_origin": "TOPLEFT" }, "text": ", to merge with both left and upper neighbor cells", "orig": ", to merge with both left and upper neighbor cells", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 12, "label": "list_item", "bbox": { "l": 141.0, "t": 622.3, "r": 328.6, "b": 631.1, "coord_origin": "TOPLEFT" }, "confidence": 0.86, "cells": [ { "index": 54, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 141.0, "r_y0": 631.1, "r_x1": 146.7, "r_y1": 631.1, "r_x2": 146.7, "r_y2": 622.3, "r_x3": 141.0, "r_y3": 622.3, "coord_origin": "TOPLEFT" }, "text": "-", "orig": "-", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 55, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 151.7, "r_y0": 631.1, "r_x1": 182.0, "r_y1": 631.1, "r_x2": 182.0, "r_y2": 622.3, "r_x3": 151.7, "r_y3": 622.3, "coord_origin": "TOPLEFT" }, "text": "\"NL\" -", "orig": "\"NL\" -", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 56, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 185.3, "r_y0": 631.1, "r_x1": 221.5, "r_y1": 631.1, "r_x2": 221.5, "r_y2": 622.3, "r_x3": 185.3, "r_y3": 622.3, "coord_origin": "TOPLEFT" }, "text": "new-line", "orig": "new-line", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 57, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 221.5, "r_y0": 631.1, "r_x1": 328.6, "r_y1": 631.1, "r_x2": 328.6, "r_y2": 622.3, "r_x3": 221.5, "r_y3": 622.3, "coord_origin": "TOPLEFT" }, "text": ", switch to the next row.", "orig": ", switch to the next row.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 6, "label": "text", "bbox": { "l": 134.8, "t": 644.1, "r": 480.6, "b": 664.9, "coord_origin": "TOPLEFT" }, "confidence": 0.94, "cells": [ { "index": 58, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 149.7, "r_y0": 652.9, "r_x1": 480.6, "r_y1": 652.9, "r_x2": 480.6, "r_y2": 644.1, "r_x3": 149.7, "r_y3": 644.1, "coord_origin": "TOPLEFT" }, "text": "A notable attribute of OTSL is that it has the capability of achieving lossless", "orig": "A notable attribute of OTSL is that it has the capability of achieving lossless", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 59, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 134.8, "r_y0": 664.9, "r_x1": 228.2, "r_y1": 664.9, "r_x2": 228.2, "r_y2": 656.1, "r_x3": 134.8, "r_y3": 656.1, "coord_origin": "TOPLEFT" }, "text": "conversion to HTML.", "orig": "conversion to HTML.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] } ] }, "tablestructure": { "table_map": {} }, "figures_classification": null, "equations_prediction": null, "vlm_response": null }, "assembled": { "elements": [ { "label": "page_header", "id": 14, "page_no": 5, "cluster": { "id": 14, "label": "page_header", "bbox": { "l": 134.8, "t": 93.8, "r": 139.4, "b": 101.8, "coord_origin": "TOPLEFT" }, "confidence": 0.84, "cells": [ { "index": 0, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 134.8, "r_y0": 101.8, "r_x1": 139.4, "r_y1": 101.8, "r_x2": 139.4, "r_y2": 93.8, "r_x3": 134.8, "r_y3": 93.8, "coord_origin": "TOPLEFT" }, "text": "6", "orig": "6", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, "text": "6" }, { "label": "page_header", "id": 11, "page_no": 5, "cluster": { "id": 11, "label": "page_header", "bbox": { "l": 167.8, "t": 93.8, "r": 231.7, "b": 101.8, "coord_origin": "TOPLEFT" }, "confidence": 0.89, "cells": [ { "index": 1, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 167.8, "r_y0": 101.8, "r_x1": 178.1, "r_y1": 101.8, "r_x2": 178.1, "r_y2": 93.8, "r_x3": 167.8, "r_y3": 93.8, "coord_origin": "TOPLEFT" }, "text": "M.", "orig": "M.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 2, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 182.4, "r_y0": 101.8, "r_x1": 231.7, "r_y1": 101.8, "r_x2": 231.7, "r_y2": 93.8, "r_x3": 182.4, "r_y3": 93.8, "coord_origin": "TOPLEFT" }, "text": "Lysak, et al.", "orig": "Lysak, et al.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, "text": "M. Lysak, et al." }, { "label": "text", "id": 3, "page_no": 5, "cluster": { "id": 3, "label": "text", "bbox": { "l": 134.8, "t": 118.9, "r": 480.6, "b": 139.7, "coord_origin": "TOPLEFT" }, "confidence": 0.96, "cells": [ { "index": 3, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 134.8, "r_y0": 127.7, "r_x1": 480.6, "r_y1": 127.7, "r_x2": 480.6, "r_y2": 118.9, "r_x3": 134.8, "r_y3": 118.9, "coord_origin": "TOPLEFT" }, "text": "generation. Implicitly, this also means that Im2Seq models need to learn these", "orig": "generation. Implicitly, this also means that Im2Seq models need to learn these", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 4, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 134.8, "r_y0": 139.7, "r_x1": 364.6, "r_y1": 139.7, "r_x2": 364.6, "r_y2": 130.9, "r_x3": 134.8, "r_y3": 130.9, "coord_origin": "TOPLEFT" }, "text": "complex syntax rules, simply to deliver valid output.", "orig": "complex syntax rules, simply to deliver valid output.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, "text": "generation. Implicitly, this also means that Im2Seq models need to learn these complex syntax rules, simply to deliver valid output." }, { "label": "text", "id": 1, "page_no": 5, "cluster": { "id": 1, "label": "text", "bbox": { "l": 134.8, "t": 143.5, "r": 480.6, "b": 295.7, "coord_origin": "TOPLEFT" }, "confidence": 0.99, "cells": [ { "index": 5, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 149.7, "r_y0": 152.3, "r_x1": 480.6, "r_y1": 152.3, "r_x2": 480.6, "r_y2": 143.5, "r_x3": 149.7, "r_y3": 143.5, "coord_origin": "TOPLEFT" }, "text": "In practice, we observe two major issues with prediction quality when train-", "orig": "In practice, we observe two major issues with prediction quality when train-", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 6, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 134.8, "r_y0": 164.2, "r_x1": 480.6, "r_y1": 164.2, "r_x2": 480.6, "r_y2": 155.4, "r_x3": 134.8, "r_y3": 155.4, "coord_origin": "TOPLEFT" }, "text": "ing Im2Seq models on HTML table structure generation from images. On the", "orig": "ing Im2Seq models on HTML table structure generation from images. On the", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 7, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 134.8, "r_y0": 176.2, "r_x1": 480.6, "r_y1": 176.2, "r_x2": 480.6, "r_y2": 167.4, "r_x3": 134.8, "r_y3": 167.4, "coord_origin": "TOPLEFT" }, "text": "one hand, we find that on large tables, the visual attention of the model often", "orig": "one hand, we find that on large tables, the visual attention of the model often", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 8, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 134.8, "r_y0": 188.1, "r_x1": 480.6, "r_y1": 188.1, "r_x2": 480.6, "r_y2": 179.3, "r_x3": 134.8, "r_y3": 179.3, "coord_origin": "TOPLEFT" }, "text": "starts to drift and is not accurately moving forward cell by cell anymore. This", "orig": "starts to drift and is not accurately moving forward cell by cell anymore. This", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 9, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 134.8, "r_y0": 200.1, "r_x1": 314.3, "r_y1": 200.1, "r_x2": 314.3, "r_y2": 191.3, "r_x3": 134.8, "r_y3": 191.3, "coord_origin": "TOPLEFT" }, "text": "manifests itself in either in an increasing", "orig": "manifests itself in either in an increasing", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 10, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 318.1, "r_y0": 200.1, "r_x1": 374.1, "r_y1": 200.1, "r_x2": 374.1, "r_y2": 191.3, "r_x3": 318.1, "r_y3": 191.3, "coord_origin": "TOPLEFT" }, "text": "location drift", "orig": "location drift", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 11, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 378.8, "r_y0": 200.1, "r_x1": 480.6, "r_y1": 200.1, "r_x2": 480.6, "r_y2": 191.3, "r_x3": 378.8, "r_y3": 191.3, "coord_origin": "TOPLEFT" }, "text": "for proposed table-cells", "orig": "for proposed table-cells", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 12, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 134.8, "r_y0": 212.1, "r_x1": 480.6, "r_y1": 212.1, "r_x2": 480.6, "r_y2": 203.3, "r_x3": 134.8, "r_y3": 203.3, "coord_origin": "TOPLEFT" }, "text": "in later rows on the same column or even complete loss of vertical alignment, as", "orig": "in later rows on the same column or even complete loss of vertical alignment, as", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 13, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 134.8, "r_y0": 224.0, "r_x1": 480.6, "r_y1": 224.0, "r_x2": 480.6, "r_y2": 215.2, "r_x3": 134.8, "r_y3": 215.2, "coord_origin": "TOPLEFT" }, "text": "illustrated in Figure 5. Addressing this with post-processing is partially possible,", "orig": "illustrated in Figure 5. Addressing this with post-processing is partially possible,", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 14, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 134.8, "r_y0": 236.0, "r_x1": 480.6, "r_y1": 236.0, "r_x2": 480.6, "r_y2": 227.2, "r_x3": 134.8, "r_y3": 227.2, "coord_origin": "TOPLEFT" }, "text": "but clearly undesired. On the other hand, we find many instances of predictions", "orig": "but clearly undesired. On the other hand, we find many instances of predictions", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 15, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 134.8, "r_y0": 247.9, "r_x1": 480.6, "r_y1": 247.9, "r_x2": 480.6, "r_y2": 239.1, "r_x3": 134.8, "r_y3": 239.1, "coord_origin": "TOPLEFT" }, "text": "with structural inconsistencies or plain invalid HTML output, as shown in Fig-", "orig": "with structural inconsistencies or plain invalid HTML output, as shown in Fig-", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 16, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 134.8, "r_y0": 259.9, "r_x1": 480.6, "r_y1": 259.9, "r_x2": 480.6, "r_y2": 251.1, "r_x3": 134.8, "r_y3": 251.1, "coord_origin": "TOPLEFT" }, "text": "ure 6, which are nearly impossible to properly correct. Both problems seriously", "orig": "ure 6, which are nearly impossible to properly correct. Both problems seriously", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 17, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 134.8, "r_y0": 271.8, "r_x1": 480.6, "r_y1": 271.8, "r_x2": 480.6, "r_y2": 263.0, "r_x3": 134.8, "r_y3": 263.0, "coord_origin": "TOPLEFT" }, "text": "impact the TSR model performance, since they reflect not only in the task of", "orig": "impact the TSR model performance, since they reflect not only in the task of", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 18, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 134.8, "r_y0": 283.8, "r_x1": 480.6, "r_y1": 283.8, "r_x2": 480.6, "r_y2": 275.0, "r_x3": 134.8, "r_y3": 275.0, "coord_origin": "TOPLEFT" }, "text": "pure structure recognition but also in the equally crucial recognition or matching", "orig": "pure structure recognition but also in the equally crucial recognition or matching", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 19, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 134.8, "r_y0": 295.7, "r_x1": 223.6, "r_y1": 295.7, "r_x2": 223.6, "r_y2": 286.9, "r_x3": 134.8, "r_y3": 286.9, "coord_origin": "TOPLEFT" }, "text": "of table cell content.", "orig": "of table cell content.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, "text": "In practice, we observe two major issues with prediction quality when training Im2Seq models on HTML table structure generation from images. On the one hand, we find that on large tables, the visual attention of the model often starts to drift and is not accurately moving forward cell by cell anymore. This manifests itself in either in an increasing location drift for proposed table-cells in later rows on the same column or even complete loss of vertical alignment, as illustrated in Figure 5. Addressing this with post-processing is partially possible, but clearly undesired. On the other hand, we find many instances of predictions with structural inconsistencies or plain invalid HTML output, as shown in Figure 6, which are nearly impossible to properly correct. Both problems seriously impact the TSR model performance, since they reflect not only in the task of pure structure recognition but also in the equally crucial recognition or matching of table cell content." }, { "label": "section_header", "id": 4, "page_no": 5, "cluster": { "id": 4, "label": "section_header", "bbox": { "l": 134.8, "t": 320.6, "r": 372.5, "b": 331.2, "coord_origin": "TOPLEFT" }, "confidence": 0.96, "cells": [ { "index": 20, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 134.8, "r_y0": 331.2, "r_x1": 141.5, "r_y1": 331.2, "r_x2": 141.5, "r_y2": 320.6, "r_x3": 134.8, "r_y3": 320.6, "coord_origin": "TOPLEFT" }, "text": "4", "orig": "4", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 21, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 154.9, "r_y0": 331.2, "r_x1": 372.5, "r_y1": 331.2, "r_x2": 372.5, "r_y2": 320.6, "r_x3": 154.9, "r_y3": 320.6, "coord_origin": "TOPLEFT" }, "text": "Optimised Table Structure Language", "orig": "Optimised Table Structure Language", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, "text": "4 Optimised Table Structure Language" }, { "label": "text", "id": 0, "page_no": 5, "cluster": { "id": 0, "label": "text", "bbox": { "l": 134.8, "t": 349.1, "r": 480.6, "b": 441.6, "coord_origin": "TOPLEFT" }, "confidence": 0.99, "cells": [ { "index": 22, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 134.8, "r_y0": 357.9, "r_x1": 480.6, "r_y1": 357.9, "r_x2": 480.6, "r_y2": 349.1, "r_x3": 134.8, "r_y3": 349.1, "coord_origin": "TOPLEFT" }, "text": "To mitigate the issues with HTML in Im2Seq-based TSR models laid out before,", "orig": "To mitigate the issues with HTML in Im2Seq-based TSR models laid out before,", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 23, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 134.8, "r_y0": 369.9, "r_x1": 480.6, "r_y1": 369.9, "r_x2": 480.6, "r_y2": 361.1, "r_x3": 134.8, "r_y3": 361.1, "coord_origin": "TOPLEFT" }, "text": "we propose here our Optimised Table Structure Language (OTSL). OTSL is", "orig": "we propose here our Optimised Table Structure Language (OTSL). OTSL is", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 24, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 134.8, "r_y0": 381.8, "r_x1": 480.6, "r_y1": 381.8, "r_x2": 480.6, "r_y2": 373.0, "r_x3": 134.8, "r_y3": 373.0, "coord_origin": "TOPLEFT" }, "text": "designed to express table structure with a minimized vocabulary and a simple", "orig": "designed to express table structure with a minimized vocabulary and a simple", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 25, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 134.8, "r_y0": 393.8, "r_x1": 480.6, "r_y1": 393.8, "r_x2": 480.6, "r_y2": 385.0, "r_x3": 134.8, "r_y3": 385.0, "coord_origin": "TOPLEFT" }, "text": "set of rules, which are both significantly reduced compared to HTML. At the", "orig": "set of rules, which are both significantly reduced compared to HTML. At the", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 26, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 134.8, "r_y0": 405.7, "r_x1": 480.6, "r_y1": 405.7, "r_x2": 480.6, "r_y2": 396.9, "r_x3": 134.8, "r_y3": 396.9, "coord_origin": "TOPLEFT" }, "text": "same time, OTSL enables easy error detection and correction during sequence", "orig": "same time, OTSL enables easy error detection and correction during sequence", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 27, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 134.8, "r_y0": 417.7, "r_x1": 480.6, "r_y1": 417.7, "r_x2": 480.6, "r_y2": 408.9, "r_x3": 134.8, "r_y3": 408.9, "coord_origin": "TOPLEFT" }, "text": "generation. We further demonstrate how the compact structure representation", "orig": "generation. We further demonstrate how the compact structure representation", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 28, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 134.8, "r_y0": 429.6, "r_x1": 480.6, "r_y1": 429.6, "r_x2": 480.6, "r_y2": 420.8, "r_x3": 134.8, "r_y3": 420.8, "coord_origin": "TOPLEFT" }, "text": "and minimized sequence length improves prediction accuracy and inference time", "orig": "and minimized sequence length improves prediction accuracy and inference time", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 29, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 134.8, "r_y0": 441.6, "r_x1": 276.7, "r_y1": 441.6, "r_x2": 276.7, "r_y2": 432.8, "r_x3": 134.8, "r_y3": 432.8, "coord_origin": "TOPLEFT" }, "text": "in the TableFormer architecture.", "orig": "in the TableFormer architecture.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, "text": "To mitigate the issues with HTML in Im2Seq-based TSR models laid out before, we propose here our Optimised Table Structure Language (OTSL). OTSL is designed to express table structure with a minimized vocabulary and a simple set of rules, which are both significantly reduced compared to HTML. At the same time, OTSL enables easy error detection and correction during sequence generation. We further demonstrate how the compact structure representation and minimized sequence length improves prediction accuracy and inference time in the TableFormer architecture." }, { "label": "section_header", "id": 5, "page_no": 5, "cluster": { "id": 5, "label": "section_header", "bbox": { "l": 134.8, "t": 465.9, "r": 261.8, "b": 474.7, "coord_origin": "TOPLEFT" }, "confidence": 0.96, "cells": [ { "index": 30, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 134.8, "r_y0": 474.7, "r_x1": 149.4, "r_y1": 474.7, "r_x2": 149.4, "r_y2": 465.9, "r_x3": 134.8, "r_y3": 465.9, "coord_origin": "TOPLEFT" }, "text": "4.1", "orig": "4.1", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 31, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 160.9, "r_y0": 474.7, "r_x1": 261.8, "r_y1": 474.7, "r_x2": 261.8, "r_y2": 465.9, "r_x3": 160.9, "r_y3": 465.9, "coord_origin": "TOPLEFT" }, "text": "Language Definition", "orig": "Language Definition", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, "text": "4.1 Language Definition" }, { "label": "text", "id": 2, "page_no": 5, "cluster": { "id": 2, "label": "text", "bbox": { "l": 134.8, "t": 489.0, "r": 480.6, "b": 521.7, "coord_origin": "TOPLEFT" }, "confidence": 0.97, "cells": [ { "index": 32, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 134.8, "r_y0": 497.8, "r_x1": 480.6, "r_y1": 497.8, "r_x2": 480.6, "r_y2": 489.0, "r_x3": 134.8, "r_y3": 489.0, "coord_origin": "TOPLEFT" }, "text": "In Figure 3, we illustrate how the OTSL is defined. In essence, the OTSL defines", "orig": "In Figure 3, we illustrate how the OTSL is defined. In essence, the OTSL defines", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 33, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 134.8, "r_y0": 509.7, "r_x1": 480.6, "r_y1": 509.7, "r_x2": 480.6, "r_y2": 501.0, "r_x3": 134.8, "r_y3": 501.0, "coord_origin": "TOPLEFT" }, "text": "only 5 tokens that directly describe a tabular structure based on an atomic 2D", "orig": "only 5 tokens that directly describe a tabular structure based on an atomic 2D", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 34, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 134.8, "r_y0": 521.7, "r_x1": 154.7, "r_y1": 521.7, "r_x2": 154.7, "r_y2": 512.9, "r_x3": 134.8, "r_y3": 512.9, "coord_origin": "TOPLEFT" }, "text": "grid.", "orig": "grid.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, "text": "In Figure 3, we illustrate how the OTSL is defined. In essence, the OTSL defines only 5 tokens that directly describe a tabular structure based on an atomic 2D grid." }, { "label": "text", "id": 13, "page_no": 5, "cluster": { "id": 13, "label": "text", "bbox": { "l": 149.7, "t": 525.5, "r": 409.3, "b": 534.3, "coord_origin": "TOPLEFT" }, "confidence": 0.86, "cells": [ { "index": 35, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 149.7, "r_y0": 534.3, "r_x1": 409.3, "r_y1": 534.3, "r_x2": 409.3, "r_y2": 525.5, "r_x3": 149.7, "r_y3": 525.5, "coord_origin": "TOPLEFT" }, "text": "The OTSL vocabulary is comprised of the following tokens:", "orig": "The OTSL vocabulary is comprised of the following tokens:", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, "text": "The OTSL vocabulary is comprised of the following tokens:" }, { "label": "list_item", "id": 9, "page_no": 5, "cluster": { "id": 9, "label": "list_item", "bbox": { "l": 141.0, "t": 548.0, "r": 460.5, "b": 556.8, "coord_origin": "TOPLEFT" }, "confidence": 0.92, "cells": [ { "index": 36, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 141.0, "r_y0": 556.8, "r_x1": 146.7, "r_y1": 556.8, "r_x2": 146.7, "r_y2": 548.0, "r_x3": 141.0, "r_y3": 548.0, "coord_origin": "TOPLEFT" }, "text": "-", "orig": "-", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 37, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 151.7, "r_y0": 556.8, "r_x1": 193.2, "r_y1": 556.8, "r_x2": 193.2, "r_y2": 548.0, "r_x3": 151.7, "r_y3": 548.0, "coord_origin": "TOPLEFT" }, "text": "\"C\" cell -", "orig": "\"C\" cell -", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 38, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 196.5, "r_y0": 556.8, "r_x1": 263.5, "r_y1": 556.8, "r_x2": 263.5, "r_y2": 548.0, "r_x3": 196.5, "r_y3": 548.0, "coord_origin": "TOPLEFT" }, "text": "a new table cell", "orig": "a new table cell", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 39, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 267.8, "r_y0": 556.8, "r_x1": 460.5, "r_y1": 556.8, "r_x2": 460.5, "r_y2": 548.0, "r_x3": 267.8, "r_y3": 548.0, "coord_origin": "TOPLEFT" }, "text": "that either has or does not have cell content", "orig": "that either has or does not have cell content", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, "text": "-\"C\" cell a new table cell that either has or does not have cell content" }, { "label": "list_item", "id": 8, "page_no": 5, "cluster": { "id": 8, "label": "list_item", "bbox": { "l": 141.0, "t": 560.6, "r": 480.6, "b": 581.3, "coord_origin": "TOPLEFT" }, "confidence": 0.93, "cells": [ { "index": 40, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 141.0, "r_y0": 569.4, "r_x1": 146.7, "r_y1": 569.4, "r_x2": 146.7, "r_y2": 560.6, "r_x3": 141.0, "r_y3": 560.6, "coord_origin": "TOPLEFT" }, "text": "-", "orig": "-", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 41, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 151.7, "r_y0": 569.4, "r_x1": 194.3, "r_y1": 569.4, "r_x2": 194.3, "r_y2": 560.6, "r_x3": 151.7, "r_y3": 560.6, "coord_origin": "TOPLEFT" }, "text": "\"L\" cell -", "orig": "\"L\" cell -", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 42, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 198.7, "r_y0": 569.4, "r_x1": 264.5, "r_y1": 569.4, "r_x2": 264.5, "r_y2": 560.6, "r_x3": 198.7, "r_y3": 560.6, "coord_origin": "TOPLEFT" }, "text": "left-looking cell", "orig": "left-looking cell", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 43, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 264.5, "r_y0": 569.4, "r_x1": 480.6, "r_y1": 569.4, "r_x2": 480.6, "r_y2": 560.6, "r_x3": 264.5, "r_y3": 560.6, "coord_origin": "TOPLEFT" }, "text": ", merging with the left neighbor cell to create a", "orig": ", merging with the left neighbor cell to create a", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 44, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 151.7, "r_y0": 581.3, "r_x1": 171.7, "r_y1": 581.3, "r_x2": 171.7, "r_y2": 572.5, "r_x3": 151.7, "r_y3": 572.5, "coord_origin": "TOPLEFT" }, "text": "span", "orig": "span", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, "text": "-\"L\" cell left-looking cell , merging with the left neighbor cell to create a span" }, { "label": "list_item", "id": 7, "page_no": 5, "cluster": { "id": 7, "label": "list_item", "bbox": { "l": 141.0, "t": 585.1, "r": 480.6, "b": 605.9, "coord_origin": "TOPLEFT" }, "confidence": 0.94, "cells": [ { "index": 45, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 141.0, "r_y0": 593.9, "r_x1": 146.7, "r_y1": 593.9, "r_x2": 146.7, "r_y2": 585.1, "r_x3": 141.0, "r_y3": 585.1, "coord_origin": "TOPLEFT" }, "text": "-", "orig": "-", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 46, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 151.7, "r_y0": 593.9, "r_x1": 194.1, "r_y1": 593.9, "r_x2": 194.1, "r_y2": 585.1, "r_x3": 151.7, "r_y3": 585.1, "coord_origin": "TOPLEFT" }, "text": "\"U\" cell -", "orig": "\"U\" cell -", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 47, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 197.7, "r_y0": 593.9, "r_x1": 259.9, "r_y1": 593.9, "r_x2": 259.9, "r_y2": 585.1, "r_x3": 197.7, "r_y3": 585.1, "coord_origin": "TOPLEFT" }, "text": "up-looking cell", "orig": "up-looking cell", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 48, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 259.9, "r_y0": 593.9, "r_x1": 480.6, "r_y1": 593.9, "r_x2": 480.6, "r_y2": 585.1, "r_x3": 259.9, "r_y3": 585.1, "coord_origin": "TOPLEFT" }, "text": ", merging with the upper neighbor cell to create a", "orig": ", merging with the upper neighbor cell to create a", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 49, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 151.7, "r_y0": 605.9, "r_x1": 171.7, "r_y1": 605.9, "r_x2": 171.7, "r_y2": 597.1, "r_x3": 151.7, "r_y3": 597.1, "coord_origin": "TOPLEFT" }, "text": "span", "orig": "span", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, "text": "-\"U\" cell up-looking cell , merging with the upper neighbor cell to create a span" }, { "label": "list_item", "id": 10, "page_no": 5, "cluster": { "id": 10, "label": "list_item", "bbox": { "l": 141.0, "t": 609.7, "r": 454.6, "b": 618.5, "coord_origin": "TOPLEFT" }, "confidence": 0.9, "cells": [ { "index": 50, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 141.0, "r_y0": 618.5, "r_x1": 146.7, "r_y1": 618.5, "r_x2": 146.7, "r_y2": 609.7, "r_x3": 141.0, "r_y3": 609.7, "coord_origin": "TOPLEFT" }, "text": "-", "orig": "-", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 51, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 151.7, "r_y0": 618.5, "r_x1": 193.5, "r_y1": 618.5, "r_x2": 193.5, "r_y2": 609.7, "r_x3": 151.7, "r_y3": 609.7, "coord_origin": "TOPLEFT" }, "text": "\"X\" cell -", "orig": "\"X\" cell -", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 52, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 196.8, "r_y0": 618.5, "r_x1": 236.1, "r_y1": 618.5, "r_x2": 236.1, "r_y2": 609.7, "r_x3": 196.8, "r_y3": 609.7, "coord_origin": "TOPLEFT" }, "text": "cross cell", "orig": "cross cell", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 53, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 236.1, "r_y0": 618.5, "r_x1": 454.6, "r_y1": 618.5, "r_x2": 454.6, "r_y2": 609.7, "r_x3": 236.1, "r_y3": 609.7, "coord_origin": "TOPLEFT" }, "text": ", to merge with both left and upper neighbor cells", "orig": ", to merge with both left and upper neighbor cells", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, "text": "-\"X\" cell cross cell , to merge with both left and upper neighbor cells" }, { "label": "list_item", "id": 12, "page_no": 5, "cluster": { "id": 12, "label": "list_item", "bbox": { "l": 141.0, "t": 622.3, "r": 328.6, "b": 631.1, "coord_origin": "TOPLEFT" }, "confidence": 0.86, "cells": [ { "index": 54, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 141.0, "r_y0": 631.1, "r_x1": 146.7, "r_y1": 631.1, "r_x2": 146.7, "r_y2": 622.3, "r_x3": 141.0, "r_y3": 622.3, "coord_origin": "TOPLEFT" }, "text": "-", "orig": "-", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 55, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 151.7, "r_y0": 631.1, "r_x1": 182.0, "r_y1": 631.1, "r_x2": 182.0, "r_y2": 622.3, "r_x3": 151.7, "r_y3": 622.3, "coord_origin": "TOPLEFT" }, "text": "\"NL\" -", "orig": "\"NL\" -", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 56, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 185.3, "r_y0": 631.1, "r_x1": 221.5, "r_y1": 631.1, "r_x2": 221.5, "r_y2": 622.3, "r_x3": 185.3, "r_y3": 622.3, "coord_origin": "TOPLEFT" }, "text": "new-line", "orig": "new-line", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 57, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 221.5, "r_y0": 631.1, "r_x1": 328.6, "r_y1": 631.1, "r_x2": 328.6, "r_y2": 622.3, "r_x3": 221.5, "r_y3": 622.3, "coord_origin": "TOPLEFT" }, "text": ", switch to the next row.", "orig": ", switch to the next row.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, "text": "-\"NL\" new-line , switch to the next row." }, { "label": "text", "id": 6, "page_no": 5, "cluster": { "id": 6, "label": "text", "bbox": { "l": 134.8, "t": 644.1, "r": 480.6, "b": 664.9, "coord_origin": "TOPLEFT" }, "confidence": 0.94, "cells": [ { "index": 58, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 149.7, "r_y0": 652.9, "r_x1": 480.6, "r_y1": 652.9, "r_x2": 480.6, "r_y2": 644.1, "r_x3": 149.7, "r_y3": 644.1, "coord_origin": "TOPLEFT" }, "text": "A notable attribute of OTSL is that it has the capability of achieving lossless", "orig": "A notable attribute of OTSL is that it has the capability of achieving lossless", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 59, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 134.8, "r_y0": 664.9, "r_x1": 228.2, "r_y1": 664.9, "r_x2": 228.2, "r_y2": 656.1, "r_x3": 134.8, "r_y3": 656.1, "coord_origin": "TOPLEFT" }, "text": "conversion to HTML.", "orig": "conversion to HTML.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, "text": "A notable attribute of OTSL is that it has the capability of achieving lossless conversion to HTML." } ], "body": [ { "label": "text", "id": 3, "page_no": 5, "cluster": { "id": 3, "label": "text", "bbox": { "l": 134.8, "t": 118.9, "r": 480.6, "b": 139.7, "coord_origin": "TOPLEFT" }, "confidence": 0.96, "cells": [ { "index": 3, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 134.8, "r_y0": 127.7, "r_x1": 480.6, "r_y1": 127.7, "r_x2": 480.6, "r_y2": 118.9, "r_x3": 134.8, "r_y3": 118.9, "coord_origin": "TOPLEFT" }, "text": "generation. Implicitly, this also means that Im2Seq models need to learn these", "orig": "generation. Implicitly, this also means that Im2Seq models need to learn these", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 4, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 134.8, "r_y0": 139.7, "r_x1": 364.6, "r_y1": 139.7, "r_x2": 364.6, "r_y2": 130.9, "r_x3": 134.8, "r_y3": 130.9, "coord_origin": "TOPLEFT" }, "text": "complex syntax rules, simply to deliver valid output.", "orig": "complex syntax rules, simply to deliver valid output.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, "text": "generation. Implicitly, this also means that Im2Seq models need to learn these complex syntax rules, simply to deliver valid output." }, { "label": "text", "id": 1, "page_no": 5, "cluster": { "id": 1, "label": "text", "bbox": { "l": 134.8, "t": 143.5, "r": 480.6, "b": 295.7, "coord_origin": "TOPLEFT" }, "confidence": 0.99, "cells": [ { "index": 5, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 149.7, "r_y0": 152.3, "r_x1": 480.6, "r_y1": 152.3, "r_x2": 480.6, "r_y2": 143.5, "r_x3": 149.7, "r_y3": 143.5, "coord_origin": "TOPLEFT" }, "text": "In practice, we observe two major issues with prediction quality when train-", "orig": "In practice, we observe two major issues with prediction quality when train-", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 6, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 134.8, "r_y0": 164.2, "r_x1": 480.6, "r_y1": 164.2, "r_x2": 480.6, "r_y2": 155.4, "r_x3": 134.8, "r_y3": 155.4, "coord_origin": "TOPLEFT" }, "text": "ing Im2Seq models on HTML table structure generation from images. On the", "orig": "ing Im2Seq models on HTML table structure generation from images. On the", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 7, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 134.8, "r_y0": 176.2, "r_x1": 480.6, "r_y1": 176.2, "r_x2": 480.6, "r_y2": 167.4, "r_x3": 134.8, "r_y3": 167.4, "coord_origin": "TOPLEFT" }, "text": "one hand, we find that on large tables, the visual attention of the model often", "orig": "one hand, we find that on large tables, the visual attention of the model often", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 8, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 134.8, "r_y0": 188.1, "r_x1": 480.6, "r_y1": 188.1, "r_x2": 480.6, "r_y2": 179.3, "r_x3": 134.8, "r_y3": 179.3, "coord_origin": "TOPLEFT" }, "text": "starts to drift and is not accurately moving forward cell by cell anymore. This", "orig": "starts to drift and is not accurately moving forward cell by cell anymore. This", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 9, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 134.8, "r_y0": 200.1, "r_x1": 314.3, "r_y1": 200.1, "r_x2": 314.3, "r_y2": 191.3, "r_x3": 134.8, "r_y3": 191.3, "coord_origin": "TOPLEFT" }, "text": "manifests itself in either in an increasing", "orig": "manifests itself in either in an increasing", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 10, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 318.1, "r_y0": 200.1, "r_x1": 374.1, "r_y1": 200.1, "r_x2": 374.1, "r_y2": 191.3, "r_x3": 318.1, "r_y3": 191.3, "coord_origin": "TOPLEFT" }, "text": "location drift", "orig": "location drift", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 11, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 378.8, "r_y0": 200.1, "r_x1": 480.6, "r_y1": 200.1, "r_x2": 480.6, "r_y2": 191.3, "r_x3": 378.8, "r_y3": 191.3, "coord_origin": "TOPLEFT" }, "text": "for proposed table-cells", "orig": "for proposed table-cells", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 12, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 134.8, "r_y0": 212.1, "r_x1": 480.6, "r_y1": 212.1, "r_x2": 480.6, "r_y2": 203.3, "r_x3": 134.8, "r_y3": 203.3, "coord_origin": "TOPLEFT" }, "text": "in later rows on the same column or even complete loss of vertical alignment, as", "orig": "in later rows on the same column or even complete loss of vertical alignment, as", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 13, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 134.8, "r_y0": 224.0, "r_x1": 480.6, "r_y1": 224.0, "r_x2": 480.6, "r_y2": 215.2, "r_x3": 134.8, "r_y3": 215.2, "coord_origin": "TOPLEFT" }, "text": "illustrated in Figure 5. Addressing this with post-processing is partially possible,", "orig": "illustrated in Figure 5. Addressing this with post-processing is partially possible,", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 14, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 134.8, "r_y0": 236.0, "r_x1": 480.6, "r_y1": 236.0, "r_x2": 480.6, "r_y2": 227.2, "r_x3": 134.8, "r_y3": 227.2, "coord_origin": "TOPLEFT" }, "text": "but clearly undesired. On the other hand, we find many instances of predictions", "orig": "but clearly undesired. On the other hand, we find many instances of predictions", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 15, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 134.8, "r_y0": 247.9, "r_x1": 480.6, "r_y1": 247.9, "r_x2": 480.6, "r_y2": 239.1, "r_x3": 134.8, "r_y3": 239.1, "coord_origin": "TOPLEFT" }, "text": "with structural inconsistencies or plain invalid HTML output, as shown in Fig-", "orig": "with structural inconsistencies or plain invalid HTML output, as shown in Fig-", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 16, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 134.8, "r_y0": 259.9, "r_x1": 480.6, "r_y1": 259.9, "r_x2": 480.6, "r_y2": 251.1, "r_x3": 134.8, "r_y3": 251.1, "coord_origin": "TOPLEFT" }, "text": "ure 6, which are nearly impossible to properly correct. Both problems seriously", "orig": "ure 6, which are nearly impossible to properly correct. Both problems seriously", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 17, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 134.8, "r_y0": 271.8, "r_x1": 480.6, "r_y1": 271.8, "r_x2": 480.6, "r_y2": 263.0, "r_x3": 134.8, "r_y3": 263.0, "coord_origin": "TOPLEFT" }, "text": "impact the TSR model performance, since they reflect not only in the task of", "orig": "impact the TSR model performance, since they reflect not only in the task of", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 18, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 134.8, "r_y0": 283.8, "r_x1": 480.6, "r_y1": 283.8, "r_x2": 480.6, "r_y2": 275.0, "r_x3": 134.8, "r_y3": 275.0, "coord_origin": "TOPLEFT" }, "text": "pure structure recognition but also in the equally crucial recognition or matching", "orig": "pure structure recognition but also in the equally crucial recognition or matching", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 19, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 134.8, "r_y0": 295.7, "r_x1": 223.6, "r_y1": 295.7, "r_x2": 223.6, "r_y2": 286.9, "r_x3": 134.8, "r_y3": 286.9, "coord_origin": "TOPLEFT" }, "text": "of table cell content.", "orig": "of table cell content.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, "text": "In practice, we observe two major issues with prediction quality when training Im2Seq models on HTML table structure generation from images. On the one hand, we find that on large tables, the visual attention of the model often starts to drift and is not accurately moving forward cell by cell anymore. This manifests itself in either in an increasing location drift for proposed table-cells in later rows on the same column or even complete loss of vertical alignment, as illustrated in Figure 5. Addressing this with post-processing is partially possible, but clearly undesired. On the other hand, we find many instances of predictions with structural inconsistencies or plain invalid HTML output, as shown in Figure 6, which are nearly impossible to properly correct. Both problems seriously impact the TSR model performance, since they reflect not only in the task of pure structure recognition but also in the equally crucial recognition or matching of table cell content." }, { "label": "section_header", "id": 4, "page_no": 5, "cluster": { "id": 4, "label": "section_header", "bbox": { "l": 134.8, "t": 320.6, "r": 372.5, "b": 331.2, "coord_origin": "TOPLEFT" }, "confidence": 0.96, "cells": [ { "index": 20, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 134.8, "r_y0": 331.2, "r_x1": 141.5, "r_y1": 331.2, "r_x2": 141.5, "r_y2": 320.6, "r_x3": 134.8, "r_y3": 320.6, "coord_origin": "TOPLEFT" }, "text": "4", "orig": "4", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 21, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 154.9, "r_y0": 331.2, "r_x1": 372.5, "r_y1": 331.2, "r_x2": 372.5, "r_y2": 320.6, "r_x3": 154.9, "r_y3": 320.6, "coord_origin": "TOPLEFT" }, "text": "Optimised Table Structure Language", "orig": "Optimised Table Structure Language", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, "text": "4 Optimised Table Structure Language" }, { "label": "text", "id": 0, "page_no": 5, "cluster": { "id": 0, "label": "text", "bbox": { "l": 134.8, "t": 349.1, "r": 480.6, "b": 441.6, "coord_origin": "TOPLEFT" }, "confidence": 0.99, "cells": [ { "index": 22, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 134.8, "r_y0": 357.9, "r_x1": 480.6, "r_y1": 357.9, "r_x2": 480.6, "r_y2": 349.1, "r_x3": 134.8, "r_y3": 349.1, "coord_origin": "TOPLEFT" }, "text": "To mitigate the issues with HTML in Im2Seq-based TSR models laid out before,", "orig": "To mitigate the issues with HTML in Im2Seq-based TSR models laid out before,", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 23, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 134.8, "r_y0": 369.9, "r_x1": 480.6, "r_y1": 369.9, "r_x2": 480.6, "r_y2": 361.1, "r_x3": 134.8, "r_y3": 361.1, "coord_origin": "TOPLEFT" }, "text": "we propose here our Optimised Table Structure Language (OTSL). OTSL is", "orig": "we propose here our Optimised Table Structure Language (OTSL). OTSL is", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 24, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 134.8, "r_y0": 381.8, "r_x1": 480.6, "r_y1": 381.8, "r_x2": 480.6, "r_y2": 373.0, "r_x3": 134.8, "r_y3": 373.0, "coord_origin": "TOPLEFT" }, "text": "designed to express table structure with a minimized vocabulary and a simple", "orig": "designed to express table structure with a minimized vocabulary and a simple", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 25, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 134.8, "r_y0": 393.8, "r_x1": 480.6, "r_y1": 393.8, "r_x2": 480.6, "r_y2": 385.0, "r_x3": 134.8, "r_y3": 385.0, "coord_origin": "TOPLEFT" }, "text": "set of rules, which are both significantly reduced compared to HTML. At the", "orig": "set of rules, which are both significantly reduced compared to HTML. At the", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 26, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 134.8, "r_y0": 405.7, "r_x1": 480.6, "r_y1": 405.7, "r_x2": 480.6, "r_y2": 396.9, "r_x3": 134.8, "r_y3": 396.9, "coord_origin": "TOPLEFT" }, "text": "same time, OTSL enables easy error detection and correction during sequence", "orig": "same time, OTSL enables easy error detection and correction during sequence", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 27, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 134.8, "r_y0": 417.7, "r_x1": 480.6, "r_y1": 417.7, "r_x2": 480.6, "r_y2": 408.9, "r_x3": 134.8, "r_y3": 408.9, "coord_origin": "TOPLEFT" }, "text": "generation. We further demonstrate how the compact structure representation", "orig": "generation. We further demonstrate how the compact structure representation", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 28, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 134.8, "r_y0": 429.6, "r_x1": 480.6, "r_y1": 429.6, "r_x2": 480.6, "r_y2": 420.8, "r_x3": 134.8, "r_y3": 420.8, "coord_origin": "TOPLEFT" }, "text": "and minimized sequence length improves prediction accuracy and inference time", "orig": "and minimized sequence length improves prediction accuracy and inference time", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 29, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 134.8, "r_y0": 441.6, "r_x1": 276.7, "r_y1": 441.6, "r_x2": 276.7, "r_y2": 432.8, "r_x3": 134.8, "r_y3": 432.8, "coord_origin": "TOPLEFT" }, "text": "in the TableFormer architecture.", "orig": "in the TableFormer architecture.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, "text": "To mitigate the issues with HTML in Im2Seq-based TSR models laid out before, we propose here our Optimised Table Structure Language (OTSL). OTSL is designed to express table structure with a minimized vocabulary and a simple set of rules, which are both significantly reduced compared to HTML. At the same time, OTSL enables easy error detection and correction during sequence generation. We further demonstrate how the compact structure representation and minimized sequence length improves prediction accuracy and inference time in the TableFormer architecture." }, { "label": "section_header", "id": 5, "page_no": 5, "cluster": { "id": 5, "label": "section_header", "bbox": { "l": 134.8, "t": 465.9, "r": 261.8, "b": 474.7, "coord_origin": "TOPLEFT" }, "confidence": 0.96, "cells": [ { "index": 30, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 134.8, "r_y0": 474.7, "r_x1": 149.4, "r_y1": 474.7, "r_x2": 149.4, "r_y2": 465.9, "r_x3": 134.8, "r_y3": 465.9, "coord_origin": "TOPLEFT" }, "text": "4.1", "orig": "4.1", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 31, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 160.9, "r_y0": 474.7, "r_x1": 261.8, "r_y1": 474.7, "r_x2": 261.8, "r_y2": 465.9, "r_x3": 160.9, "r_y3": 465.9, "coord_origin": "TOPLEFT" }, "text": "Language Definition", "orig": "Language Definition", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, "text": "4.1 Language Definition" }, { "label": "text", "id": 2, "page_no": 5, "cluster": { "id": 2, "label": "text", "bbox": { "l": 134.8, "t": 489.0, "r": 480.6, "b": 521.7, "coord_origin": "TOPLEFT" }, "confidence": 0.97, "cells": [ { "index": 32, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 134.8, "r_y0": 497.8, "r_x1": 480.6, "r_y1": 497.8, "r_x2": 480.6, "r_y2": 489.0, "r_x3": 134.8, "r_y3": 489.0, "coord_origin": "TOPLEFT" }, "text": "In Figure 3, we illustrate how the OTSL is defined. In essence, the OTSL defines", "orig": "In Figure 3, we illustrate how the OTSL is defined. In essence, the OTSL defines", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 33, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 134.8, "r_y0": 509.7, "r_x1": 480.6, "r_y1": 509.7, "r_x2": 480.6, "r_y2": 501.0, "r_x3": 134.8, "r_y3": 501.0, "coord_origin": "TOPLEFT" }, "text": "only 5 tokens that directly describe a tabular structure based on an atomic 2D", "orig": "only 5 tokens that directly describe a tabular structure based on an atomic 2D", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 34, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 134.8, "r_y0": 521.7, "r_x1": 154.7, "r_y1": 521.7, "r_x2": 154.7, "r_y2": 512.9, "r_x3": 134.8, "r_y3": 512.9, "coord_origin": "TOPLEFT" }, "text": "grid.", "orig": "grid.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, "text": "In Figure 3, we illustrate how the OTSL is defined. In essence, the OTSL defines only 5 tokens that directly describe a tabular structure based on an atomic 2D grid." }, { "label": "text", "id": 13, "page_no": 5, "cluster": { "id": 13, "label": "text", "bbox": { "l": 149.7, "t": 525.5, "r": 409.3, "b": 534.3, "coord_origin": "TOPLEFT" }, "confidence": 0.86, "cells": [ { "index": 35, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 149.7, "r_y0": 534.3, "r_x1": 409.3, "r_y1": 534.3, "r_x2": 409.3, "r_y2": 525.5, "r_x3": 149.7, "r_y3": 525.5, "coord_origin": "TOPLEFT" }, "text": "The OTSL vocabulary is comprised of the following tokens:", "orig": "The OTSL vocabulary is comprised of the following tokens:", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, "text": "The OTSL vocabulary is comprised of the following tokens:" }, { "label": "list_item", "id": 9, "page_no": 5, "cluster": { "id": 9, "label": "list_item", "bbox": { "l": 141.0, "t": 548.0, "r": 460.5, "b": 556.8, "coord_origin": "TOPLEFT" }, "confidence": 0.92, "cells": [ { "index": 36, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 141.0, "r_y0": 556.8, "r_x1": 146.7, "r_y1": 556.8, "r_x2": 146.7, "r_y2": 548.0, "r_x3": 141.0, "r_y3": 548.0, "coord_origin": "TOPLEFT" }, "text": "-", "orig": "-", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 37, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 151.7, "r_y0": 556.8, "r_x1": 193.2, "r_y1": 556.8, "r_x2": 193.2, "r_y2": 548.0, "r_x3": 151.7, "r_y3": 548.0, "coord_origin": "TOPLEFT" }, "text": "\"C\" cell -", "orig": "\"C\" cell -", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 38, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 196.5, "r_y0": 556.8, "r_x1": 263.5, "r_y1": 556.8, "r_x2": 263.5, "r_y2": 548.0, "r_x3": 196.5, "r_y3": 548.0, "coord_origin": "TOPLEFT" }, "text": "a new table cell", "orig": "a new table cell", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 39, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 267.8, "r_y0": 556.8, "r_x1": 460.5, "r_y1": 556.8, "r_x2": 460.5, "r_y2": 548.0, "r_x3": 267.8, "r_y3": 548.0, "coord_origin": "TOPLEFT" }, "text": "that either has or does not have cell content", "orig": "that either has or does not have cell content", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, "text": "-\"C\" cell a new table cell that either has or does not have cell content" }, { "label": "list_item", "id": 8, "page_no": 5, "cluster": { "id": 8, "label": "list_item", "bbox": { "l": 141.0, "t": 560.6, "r": 480.6, "b": 581.3, "coord_origin": "TOPLEFT" }, "confidence": 0.93, "cells": [ { "index": 40, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 141.0, "r_y0": 569.4, "r_x1": 146.7, "r_y1": 569.4, "r_x2": 146.7, "r_y2": 560.6, "r_x3": 141.0, "r_y3": 560.6, "coord_origin": "TOPLEFT" }, "text": "-", "orig": "-", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 41, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 151.7, "r_y0": 569.4, "r_x1": 194.3, "r_y1": 569.4, "r_x2": 194.3, "r_y2": 560.6, "r_x3": 151.7, "r_y3": 560.6, "coord_origin": "TOPLEFT" }, "text": "\"L\" cell -", "orig": "\"L\" cell -", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 42, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 198.7, "r_y0": 569.4, "r_x1": 264.5, "r_y1": 569.4, "r_x2": 264.5, "r_y2": 560.6, "r_x3": 198.7, "r_y3": 560.6, "coord_origin": "TOPLEFT" }, "text": "left-looking cell", "orig": "left-looking cell", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 43, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 264.5, "r_y0": 569.4, "r_x1": 480.6, "r_y1": 569.4, "r_x2": 480.6, "r_y2": 560.6, "r_x3": 264.5, "r_y3": 560.6, "coord_origin": "TOPLEFT" }, "text": ", merging with the left neighbor cell to create a", "orig": ", merging with the left neighbor cell to create a", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 44, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 151.7, "r_y0": 581.3, "r_x1": 171.7, "r_y1": 581.3, "r_x2": 171.7, "r_y2": 572.5, "r_x3": 151.7, "r_y3": 572.5, "coord_origin": "TOPLEFT" }, "text": "span", "orig": "span", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, "text": "-\"L\" cell left-looking cell , merging with the left neighbor cell to create a span" }, { "label": "list_item", "id": 7, "page_no": 5, "cluster": { "id": 7, "label": "list_item", "bbox": { "l": 141.0, "t": 585.1, "r": 480.6, "b": 605.9, "coord_origin": "TOPLEFT" }, "confidence": 0.94, "cells": [ { "index": 45, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 141.0, "r_y0": 593.9, "r_x1": 146.7, "r_y1": 593.9, "r_x2": 146.7, "r_y2": 585.1, "r_x3": 141.0, "r_y3": 585.1, "coord_origin": "TOPLEFT" }, "text": "-", "orig": "-", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 46, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 151.7, "r_y0": 593.9, "r_x1": 194.1, "r_y1": 593.9, "r_x2": 194.1, "r_y2": 585.1, "r_x3": 151.7, "r_y3": 585.1, "coord_origin": "TOPLEFT" }, "text": "\"U\" cell -", "orig": "\"U\" cell -", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 47, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 197.7, "r_y0": 593.9, "r_x1": 259.9, "r_y1": 593.9, "r_x2": 259.9, "r_y2": 585.1, "r_x3": 197.7, "r_y3": 585.1, "coord_origin": "TOPLEFT" }, "text": "up-looking cell", "orig": "up-looking cell", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 48, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 259.9, "r_y0": 593.9, "r_x1": 480.6, "r_y1": 593.9, "r_x2": 480.6, "r_y2": 585.1, "r_x3": 259.9, "r_y3": 585.1, "coord_origin": "TOPLEFT" }, "text": ", merging with the upper neighbor cell to create a", "orig": ", merging with the upper neighbor cell to create a", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 49, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 151.7, "r_y0": 605.9, "r_x1": 171.7, "r_y1": 605.9, "r_x2": 171.7, "r_y2": 597.1, "r_x3": 151.7, "r_y3": 597.1, "coord_origin": "TOPLEFT" }, "text": "span", "orig": "span", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, "text": "-\"U\" cell up-looking cell , merging with the upper neighbor cell to create a span" }, { "label": "list_item", "id": 10, "page_no": 5, "cluster": { "id": 10, "label": "list_item", "bbox": { "l": 141.0, "t": 609.7, "r": 454.6, "b": 618.5, "coord_origin": "TOPLEFT" }, "confidence": 0.9, "cells": [ { "index": 50, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 141.0, "r_y0": 618.5, "r_x1": 146.7, "r_y1": 618.5, "r_x2": 146.7, "r_y2": 609.7, "r_x3": 141.0, "r_y3": 609.7, "coord_origin": "TOPLEFT" }, "text": "-", "orig": "-", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 51, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 151.7, "r_y0": 618.5, "r_x1": 193.5, "r_y1": 618.5, "r_x2": 193.5, "r_y2": 609.7, "r_x3": 151.7, "r_y3": 609.7, "coord_origin": "TOPLEFT" }, "text": "\"X\" cell -", "orig": "\"X\" cell -", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 52, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 196.8, "r_y0": 618.5, "r_x1": 236.1, "r_y1": 618.5, "r_x2": 236.1, "r_y2": 609.7, "r_x3": 196.8, "r_y3": 609.7, "coord_origin": "TOPLEFT" }, "text": "cross cell", "orig": "cross cell", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 53, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 236.1, "r_y0": 618.5, "r_x1": 454.6, "r_y1": 618.5, "r_x2": 454.6, "r_y2": 609.7, "r_x3": 236.1, "r_y3": 609.7, "coord_origin": "TOPLEFT" }, "text": ", to merge with both left and upper neighbor cells", "orig": ", to merge with both left and upper neighbor cells", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, "text": "-\"X\" cell cross cell , to merge with both left and upper neighbor cells" }, { "label": "list_item", "id": 12, "page_no": 5, "cluster": { "id": 12, "label": "list_item", "bbox": { "l": 141.0, "t": 622.3, "r": 328.6, "b": 631.1, "coord_origin": "TOPLEFT" }, "confidence": 0.86, "cells": [ { "index": 54, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 141.0, "r_y0": 631.1, "r_x1": 146.7, "r_y1": 631.1, "r_x2": 146.7, "r_y2": 622.3, "r_x3": 141.0, "r_y3": 622.3, "coord_origin": "TOPLEFT" }, "text": "-", "orig": "-", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 55, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 151.7, "r_y0": 631.1, "r_x1": 182.0, "r_y1": 631.1, "r_x2": 182.0, "r_y2": 622.3, "r_x3": 151.7, "r_y3": 622.3, "coord_origin": "TOPLEFT" }, "text": "\"NL\" -", "orig": "\"NL\" -", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 56, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 185.3, "r_y0": 631.1, "r_x1": 221.5, "r_y1": 631.1, "r_x2": 221.5, "r_y2": 622.3, "r_x3": 185.3, "r_y3": 622.3, "coord_origin": "TOPLEFT" }, "text": "new-line", "orig": "new-line", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 57, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 221.5, "r_y0": 631.1, "r_x1": 328.6, "r_y1": 631.1, "r_x2": 328.6, "r_y2": 622.3, "r_x3": 221.5, "r_y3": 622.3, "coord_origin": "TOPLEFT" }, "text": ", switch to the next row.", "orig": ", switch to the next row.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, "text": "-\"NL\" new-line , switch to the next row." }, { "label": "text", "id": 6, "page_no": 5, "cluster": { "id": 6, "label": "text", "bbox": { "l": 134.8, "t": 644.1, "r": 480.6, "b": 664.9, "coord_origin": "TOPLEFT" }, "confidence": 0.94, "cells": [ { "index": 58, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 149.7, "r_y0": 652.9, "r_x1": 480.6, "r_y1": 652.9, "r_x2": 480.6, "r_y2": 644.1, "r_x3": 149.7, "r_y3": 644.1, "coord_origin": "TOPLEFT" }, "text": "A notable attribute of OTSL is that it has the capability of achieving lossless", "orig": "A notable attribute of OTSL is that it has the capability of achieving lossless", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 59, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 134.8, "r_y0": 664.9, "r_x1": 228.2, "r_y1": 664.9, "r_x2": 228.2, "r_y2": 656.1, "r_x3": 134.8, "r_y3": 656.1, "coord_origin": "TOPLEFT" }, "text": "conversion to HTML.", "orig": "conversion to HTML.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, "text": "A notable attribute of OTSL is that it has the capability of achieving lossless conversion to HTML." } ], "headers": [ { "label": "page_header", "id": 14, "page_no": 5, "cluster": { "id": 14, "label": "page_header", "bbox": { "l": 134.8, "t": 93.8, "r": 139.4, "b": 101.8, "coord_origin": "TOPLEFT" }, "confidence": 0.84, "cells": [ { "index": 0, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 134.8, "r_y0": 101.8, "r_x1": 139.4, "r_y1": 101.8, "r_x2": 139.4, "r_y2": 93.8, "r_x3": 134.8, "r_y3": 93.8, "coord_origin": "TOPLEFT" }, "text": "6", "orig": "6", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, "text": "6" }, { "label": "page_header", "id": 11, "page_no": 5, "cluster": { "id": 11, "label": "page_header", "bbox": { "l": 167.8, "t": 93.8, "r": 231.7, "b": 101.8, "coord_origin": "TOPLEFT" }, "confidence": 0.89, "cells": [ { "index": 1, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 167.8, "r_y0": 101.8, "r_x1": 178.1, "r_y1": 101.8, "r_x2": 178.1, "r_y2": 93.8, "r_x3": 167.8, "r_y3": 93.8, "coord_origin": "TOPLEFT" }, "text": "M.", "orig": "M.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 2, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 182.4, "r_y0": 101.8, "r_x1": 231.7, "r_y1": 101.8, "r_x2": 231.7, "r_y2": 93.8, "r_x3": 182.4, "r_y3": 93.8, "coord_origin": "TOPLEFT" }, "text": "Lysak, et al.", "orig": "Lysak, et al.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, "text": "M. Lysak, et al." } ] } }, { "page_no": 6, "size": { "width": 612.0, "height": 792.0 }, "parsed_page": { "dimension": { "angle": 0.0, "rect": { "r_x0": 0.0, "r_y0": 0.0, "r_x1": 612.0, "r_y1": 0.0, "r_x2": 612.0, "r_y2": 792.0, "r_x3": 0.0, "r_y3": 792.0, "coord_origin": "BOTTOMLEFT" }, "boundary_type": "crop_box", "art_bbox": { "l": 0.0, "t": 792.0, "r": 612.0, "b": 0.0, "coord_origin": "BOTTOMLEFT" }, "bleed_bbox": { "l": 0.0, "t": 792.0, "r": 612.0, "b": 0.0, "coord_origin": "BOTTOMLEFT" }, "crop_bbox": { "l": 0.0, "t": 792.0, "r": 612.0, "b": 0.0, "coord_origin": "BOTTOMLEFT" }, "media_bbox": { "l": 0.0, "t": 792.0, "r": 612.0, "b": 0.0, "coord_origin": "BOTTOMLEFT" }, "trim_bbox": { "l": 0.0, "t": 792.0, "r": 612.0, "b": 0.0, "coord_origin": "BOTTOMLEFT" } }, "bitmap_resources": [], "char_cells": [], "word_cells": [], "textline_cells": [ { "index": 0, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 194.5, "r_y0": 101.8, "r_x1": 447.5, "r_y1": 101.8, "r_x2": 447.5, "r_y2": 93.8, "r_x3": 194.5, "r_y3": 93.8, "coord_origin": "TOPLEFT" }, "text": "Optimized Table Tokenization for Table Structure Recognition", "orig": "Optimized Table Tokenization for Table Structure Recognition", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 1, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 476.0, "r_y0": 101.8, "r_x1": 480.6, "r_y1": 101.8, "r_x2": 480.6, "r_y2": 93.8, "r_x3": 476.0, "r_y3": 93.8, "coord_origin": "TOPLEFT" }, "text": "7", "orig": "7", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 2, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 134.8, "r_y0": 133.7, "r_x1": 162.6, "r_y1": 133.7, "r_x2": 162.6, "r_y2": 125.8, "r_x3": 134.8, "r_y3": 125.8, "coord_origin": "TOPLEFT" }, "text": "Fig. 3.", "orig": "Fig. 3.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 3, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 166.3, "r_y0": 133.9, "r_x1": 480.6, "r_y1": 133.9, "r_x2": 480.6, "r_y2": 125.9, "r_x3": 166.3, "r_y3": 125.9, "coord_origin": "TOPLEFT" }, "text": "OTSL description of table structure: A - table example; B - graphical repre-", "orig": "OTSL description of table structure: A - table example; B - graphical repre-", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 4, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 134.8, "r_y0": 144.9, "r_x1": 480.6, "r_y1": 144.9, "r_x2": 480.6, "r_y2": 136.8, "r_x3": 134.8, "r_y3": 136.8, "coord_origin": "TOPLEFT" }, "text": "sentation of table structure; C - mapping structure on a grid; D - OTSL structure", "orig": "sentation of table structure; C - mapping structure on a grid; D - OTSL structure", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 5, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 134.8, "r_y0": 155.8, "r_x1": 306.1, "r_y1": 155.8, "r_x2": 306.1, "r_y2": 147.8, "r_x3": 134.8, "r_y3": 147.8, "coord_origin": "TOPLEFT" }, "text": "encoding; E - explanation on cell encoding", "orig": "encoding; E - explanation on cell encoding", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 6, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 374.5, "r_y0": 177.9, "r_x1": 381.7, "r_y1": 177.9, "r_x2": 381.7, "r_y2": 168.6, "r_x3": 374.5, "r_y3": 168.6, "coord_origin": "TOPLEFT" }, "text": "C", "orig": "C", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 7, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 398.7, "r_y0": 177.8, "r_x1": 405.9, "r_y1": 177.8, "r_x2": 405.9, "r_y2": 168.5, "r_x3": 398.7, "r_y3": 168.5, "coord_origin": "TOPLEFT" }, "text": "C", "orig": "C", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 8, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 373.8, "r_y0": 202.2, "r_x1": 380.9, "r_y1": 202.2, "r_x2": 380.9, "r_y2": 192.9, "r_x3": 373.8, "r_y3": 192.9, "coord_origin": "TOPLEFT" }, "text": "C", "orig": "C", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 9, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 386.7, "r_y0": 202.4, "r_x1": 393.8, "r_y1": 202.4, "r_x2": 393.8, "r_y2": 193.1, "r_x3": 386.7, "r_y3": 193.1, "coord_origin": "TOPLEFT" }, "text": "C", "orig": "C", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 10, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 386.7, "r_y0": 214.5, "r_x1": 393.9, "r_y1": 214.5, "r_x2": 393.9, "r_y2": 205.1, "r_x3": 386.7, "r_y3": 205.1, "coord_origin": "TOPLEFT" }, "text": "C", "orig": "C", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 11, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 398.7, "r_y0": 190.1, "r_x1": 405.8, "r_y1": 190.1, "r_x2": 405.8, "r_y2": 180.7, "r_x3": 398.7, "r_y3": 180.7, "coord_origin": "TOPLEFT" }, "text": "C", "orig": "C", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 12, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 410.8, "r_y0": 190.1, "r_x1": 418.0, "r_y1": 190.1, "r_x2": 418.0, "r_y2": 180.7, "r_x3": 410.8, "r_y3": 180.7, "coord_origin": "TOPLEFT" }, "text": "C", "orig": "C", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 13, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 422.9, "r_y0": 190.0, "r_x1": 430.1, "r_y1": 190.0, "r_x2": 430.1, "r_y2": 180.7, "r_x3": 422.9, "r_y3": 180.7, "coord_origin": "TOPLEFT" }, "text": "C", "orig": "C", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 14, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 398.8, "r_y0": 202.3, "r_x1": 406.0, "r_y1": 202.3, "r_x2": 406.0, "r_y2": 193.0, "r_x3": 398.8, "r_y3": 193.0, "coord_origin": "TOPLEFT" }, "text": "C", "orig": "C", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 15, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 410.9, "r_y0": 202.3, "r_x1": 418.1, "r_y1": 202.3, "r_x2": 418.1, "r_y2": 193.0, "r_x3": 410.9, "r_y3": 193.0, "coord_origin": "TOPLEFT" }, "text": "C", "orig": "C", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 16, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 423.0, "r_y0": 202.2, "r_x1": 430.2, "r_y1": 202.2, "r_x2": 430.2, "r_y2": 192.9, "r_x3": 423.0, "r_y3": 192.9, "coord_origin": "TOPLEFT" }, "text": "C", "orig": "C", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 17, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 398.8, "r_y0": 214.6, "r_x1": 406.0, "r_y1": 214.6, "r_x2": 406.0, "r_y2": 205.3, "r_x3": 398.8, "r_y3": 205.3, "coord_origin": "TOPLEFT" }, "text": "C", "orig": "C", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 18, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 410.9, "r_y0": 214.6, "r_x1": 418.1, "r_y1": 214.6, "r_x2": 418.1, "r_y2": 205.3, "r_x3": 410.9, "r_y3": 205.3, "coord_origin": "TOPLEFT" }, "text": "C", "orig": "C", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 19, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 423.0, "r_y0": 214.6, "r_x1": 430.2, "r_y1": 214.6, "r_x2": 430.2, "r_y2": 205.2, "r_x3": 423.0, "r_y3": 205.2, "coord_origin": "TOPLEFT" }, "text": "C", "orig": "C", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 20, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 386.5, "r_y0": 226.4, "r_x1": 393.7, "r_y1": 226.4, "r_x2": 393.7, "r_y2": 217.0, "r_x3": 386.5, "r_y3": 217.0, "coord_origin": "TOPLEFT" }, "text": "C", "orig": "C", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 21, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 398.6, "r_y0": 226.5, "r_x1": 405.8, "r_y1": 226.5, "r_x2": 405.8, "r_y2": 217.2, "r_x3": 398.6, "r_y3": 217.2, "coord_origin": "TOPLEFT" }, "text": "C", "orig": "C", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 22, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 410.7, "r_y0": 226.5, "r_x1": 417.9, "r_y1": 226.5, "r_x2": 417.9, "r_y2": 217.2, "r_x3": 410.7, "r_y3": 217.2, "coord_origin": "TOPLEFT" }, "text": "C", "orig": "C", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 23, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 422.8, "r_y0": 226.5, "r_x1": 430.0, "r_y1": 226.5, "r_x2": 430.0, "r_y2": 217.1, "r_x3": 422.8, "r_y3": 217.1, "coord_origin": "TOPLEFT" }, "text": "C", "orig": "C", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 24, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 435.2, "r_y0": 177.0, "r_x1": 447.9, "r_y1": 177.0, "r_x2": 447.9, "r_y2": 167.7, "r_x3": 435.2, "r_y3": 167.7, "coord_origin": "TOPLEFT" }, "text": "NL", "orig": "NL", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 25, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 435.4, "r_y0": 189.5, "r_x1": 448.1, "r_y1": 189.5, "r_x2": 448.1, "r_y2": 180.2, "r_x3": 435.4, "r_y3": 180.2, "coord_origin": "TOPLEFT" }, "text": "NL", "orig": "NL", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 26, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 435.5, "r_y0": 201.8, "r_x1": 448.2, "r_y1": 201.8, "r_x2": 448.2, "r_y2": 192.5, "r_x3": 435.5, "r_y3": 192.5, "coord_origin": "TOPLEFT" }, "text": "NL", "orig": "NL", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 27, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 435.4, "r_y0": 214.2, "r_x1": 448.1, "r_y1": 214.2, "r_x2": 448.1, "r_y2": 204.8, "r_x3": 435.4, "r_y3": 204.8, "coord_origin": "TOPLEFT" }, "text": "NL", "orig": "NL", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 28, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 435.6, "r_y0": 226.6, "r_x1": 448.3, "r_y1": 226.6, "r_x2": 448.3, "r_y2": 217.2, "r_x3": 435.6, "r_y3": 217.2, "coord_origin": "TOPLEFT" }, "text": "NL", "orig": "NL", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 29, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 374.1, "r_y0": 214.6, "r_x1": 381.3, "r_y1": 214.6, "r_x2": 381.3, "r_y2": 205.2, "r_x3": 374.1, "r_y3": 205.2, "coord_origin": "TOPLEFT" }, "text": "U", "orig": "U", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 30, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 374.0, "r_y0": 226.5, "r_x1": 381.2, "r_y1": 226.5, "r_x2": 381.2, "r_y2": 217.1, "r_x3": 374.0, "r_y3": 217.1, "coord_origin": "TOPLEFT" }, "text": "U", "orig": "U", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 31, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 374.3, "r_y0": 190.3, "r_x1": 381.5, "r_y1": 190.3, "r_x2": 381.5, "r_y2": 180.9, "r_x3": 374.3, "r_y3": 180.9, "coord_origin": "TOPLEFT" }, "text": "U", "orig": "U", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 32, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 387.8, "r_y0": 177.9, "r_x1": 393.3, "r_y1": 177.9, "r_x2": 393.3, "r_y2": 168.6, "r_x3": 387.8, "r_y3": 168.6, "coord_origin": "TOPLEFT" }, "text": "L", "orig": "L", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 33, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 411.9, "r_y0": 177.4, "r_x1": 417.4, "r_y1": 177.4, "r_x2": 417.4, "r_y2": 168.1, "r_x3": 411.9, "r_y3": 168.1, "coord_origin": "TOPLEFT" }, "text": "L", "orig": "L", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 34, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 423.3, "r_y0": 177.3, "r_x1": 428.9, "r_y1": 177.3, "r_x2": 428.9, "r_y2": 167.9, "r_x3": 423.3, "r_y3": 167.9, "coord_origin": "TOPLEFT" }, "text": "L", "orig": "L", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 35, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 387.1, "r_y0": 190.1, "r_x1": 393.8, "r_y1": 190.1, "r_x2": 393.8, "r_y2": 180.8, "r_x3": 387.1, "r_y3": 180.8, "coord_origin": "TOPLEFT" }, "text": "X", "orig": "X", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 36, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 282.3, "r_y0": 253.8, "r_x1": 289.4, "r_y1": 253.8, "r_x2": 289.4, "r_y2": 244.5, "r_x3": 282.3, "r_y3": 244.5, "coord_origin": "TOPLEFT" }, "text": "C", "orig": "C", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 37, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 282.1, "r_y0": 266.2, "r_x1": 289.3, "r_y1": 266.2, "r_x2": 289.3, "r_y2": 256.9, "r_x3": 282.1, "r_y3": 256.9, "coord_origin": "TOPLEFT" }, "text": "U", "orig": "U", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 38, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 282.4, "r_y0": 278.5, "r_x1": 289.6, "r_y1": 278.5, "r_x2": 289.6, "r_y2": 269.1, "r_x3": 282.4, "r_y3": 269.1, "coord_origin": "TOPLEFT" }, "text": "U", "orig": "U", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 39, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 295.5, "r_y0": 253.8, "r_x1": 301.1, "r_y1": 253.8, "r_x2": 301.1, "r_y2": 244.5, "r_x3": 295.5, "r_y3": 244.5, "coord_origin": "TOPLEFT" }, "text": "L", "orig": "L", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 40, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 307.5, "r_y0": 253.9, "r_x1": 313.0, "r_y1": 253.9, "r_x2": 313.0, "r_y2": 244.6, "r_x3": 307.5, "r_y3": 244.6, "coord_origin": "TOPLEFT" }, "text": "L", "orig": "L", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 41, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 318.8, "r_y0": 253.8, "r_x1": 324.3, "r_y1": 253.8, "r_x2": 324.3, "r_y2": 244.4, "r_x3": 318.8, "r_y3": 244.4, "coord_origin": "TOPLEFT" }, "text": "L", "orig": "L", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 42, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 294.9, "r_y0": 266.0, "r_x1": 301.0, "r_y1": 266.0, "r_x2": 301.0, "r_y2": 256.7, "r_x3": 294.9, "r_y3": 256.7, "coord_origin": "TOPLEFT" }, "text": "X", "orig": "X", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 43, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 307.2, "r_y0": 266.0, "r_x1": 325.6, "r_y1": 266.0, "r_x2": 325.6, "r_y2": 256.7, "r_x3": 307.2, "r_y3": 256.7, "coord_origin": "TOPLEFT" }, "text": "X X", "orig": "X X", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 44, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 294.8, "r_y0": 278.6, "r_x1": 300.9, "r_y1": 278.6, "r_x2": 300.9, "r_y2": 269.3, "r_x3": 294.8, "r_y3": 269.3, "coord_origin": "TOPLEFT" }, "text": "X", "orig": "X", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 45, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 307.1, "r_y0": 278.6, "r_x1": 325.5, "r_y1": 278.6, "r_x2": 325.5, "r_y2": 269.3, "r_x3": 307.1, "r_y3": 269.3, "coord_origin": "TOPLEFT" }, "text": "X X", "orig": "X X", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 46, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 195.9, "r_y0": 278.1, "r_x1": 203.1, "r_y1": 278.1, "r_x2": 203.1, "r_y2": 268.7, "r_x3": 195.9, "r_y3": 268.7, "coord_origin": "TOPLEFT" }, "text": "C", "orig": "C", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 47, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 209.2, "r_y0": 278.1, "r_x1": 214.7, "r_y1": 278.1, "r_x2": 214.7, "r_y2": 268.7, "r_x3": 209.2, "r_y3": 268.7, "coord_origin": "TOPLEFT" }, "text": "L", "orig": "L", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 48, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 221.1, "r_y0": 278.1, "r_x1": 226.7, "r_y1": 278.1, "r_x2": 226.7, "r_y2": 268.8, "r_x3": 221.1, "r_y3": 268.8, "coord_origin": "TOPLEFT" }, "text": "L", "orig": "L", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 49, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 232.4, "r_y0": 278.0, "r_x1": 238.0, "r_y1": 278.0, "r_x2": 238.0, "r_y2": 268.7, "r_x3": 232.4, "r_y3": 268.7, "coord_origin": "TOPLEFT" }, "text": "L", "orig": "L", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 50, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 196.2, "r_y0": 253.9, "r_x1": 203.4, "r_y1": 253.9, "r_x2": 203.4, "r_y2": 244.5, "r_x3": 196.2, "r_y3": 244.5, "coord_origin": "TOPLEFT" }, "text": "C", "orig": "C", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 51, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 250.3, "r_y0": 253.4, "r_x1": 257.5, "r_y1": 253.4, "r_x2": 257.5, "r_y2": 244.1, "r_x3": 250.3, "r_y3": 244.1, "coord_origin": "TOPLEFT" }, "text": "C", "orig": "C", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 52, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 250.2, "r_y0": 265.8, "r_x1": 257.3, "r_y1": 265.8, "r_x2": 257.3, "r_y2": 256.4, "r_x3": 250.2, "r_y3": 256.4, "coord_origin": "TOPLEFT" }, "text": "U", "orig": "U", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 53, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 250.5, "r_y0": 278.0, "r_x1": 257.6, "r_y1": 278.0, "r_x2": 257.6, "r_y2": 268.7, "r_x3": 250.5, "r_y3": 268.7, "coord_origin": "TOPLEFT" }, "text": "U", "orig": "U", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 54, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 334.5, "r_y0": 249.2, "r_x1": 337.2, "r_y1": 249.2, "r_x2": 337.2, "r_y2": 243.0, "r_x3": 334.5, "r_y3": 243.0, "coord_origin": "TOPLEFT" }, "text": "1", "orig": "1", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 55, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 339.9, "r_y0": 249.2, "r_x1": 391.5, "r_y1": 249.2, "r_x2": 391.5, "r_y2": 243.0, "r_x3": 339.9, "r_y3": 243.0, "coord_origin": "TOPLEFT" }, "text": "- simple cells: \"C\"", "orig": "- simple cells: \"C\"", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 56, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 334.5, "r_y0": 259.1, "r_x1": 337.3, "r_y1": 259.1, "r_x2": 337.3, "r_y2": 252.9, "r_x3": 334.5, "r_y3": 252.9, "coord_origin": "TOPLEFT" }, "text": "2", "orig": "2", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 57, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 340.2, "r_y0": 259.1, "r_x1": 422.0, "r_y1": 259.1, "r_x2": 422.0, "r_y2": 252.9, "r_x3": 340.2, "r_y3": 252.9, "coord_origin": "TOPLEFT" }, "text": "- horizontal merges: \"C\", \"L\"", "orig": "- horizontal merges: \"C\", \"L\"", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 58, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 334.5, "r_y0": 269.1, "r_x1": 337.3, "r_y1": 269.1, "r_x2": 337.3, "r_y2": 262.9, "r_x3": 334.5, "r_y3": 262.9, "coord_origin": "TOPLEFT" }, "text": "3", "orig": "3", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 59, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 340.1, "r_y0": 269.1, "r_x1": 415.3, "r_y1": 269.1, "r_x2": 415.3, "r_y2": 262.9, "r_x3": 340.1, "r_y3": 262.9, "coord_origin": "TOPLEFT" }, "text": "- vertical merges: \"C\", \"U\"", "orig": "- vertical merges: \"C\", \"U\"", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 60, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 334.5, "r_y0": 279.0, "r_x1": 337.3, "r_y1": 279.0, "r_x2": 337.3, "r_y2": 272.8, "r_x3": 334.5, "r_y3": 272.8, "coord_origin": "TOPLEFT" }, "text": "4", "orig": "4", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 61, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 340.1, "r_y0": 279.0, "r_x1": 426.6, "r_y1": 279.0, "r_x2": 426.6, "r_y2": 272.8, "r_x3": 340.1, "r_y3": 272.8, "coord_origin": "TOPLEFT" }, "text": "- 2d merges: \"C\", \"L\", \"U\", \"X\"", "orig": "- 2d merges: \"C\", \"L\", \"U\", \"X\"", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 62, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 185.7, "r_y0": 250.3, "r_x1": 189.4, "r_y1": 250.3, "r_x2": 189.4, "r_y2": 244.0, "r_x3": 185.7, "r_y3": 244.0, "coord_origin": "TOPLEFT" }, "text": "1", "orig": "1", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 63, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 186.0, "r_y0": 274.6, "r_x1": 189.7, "r_y1": 274.6, "r_x2": 189.7, "r_y2": 268.3, "r_x3": 186.0, "r_y3": 268.3, "coord_origin": "TOPLEFT" }, "text": "2", "orig": "2", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 64, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 239.3, "r_y0": 249.8, "r_x1": 243.0, "r_y1": 249.8, "r_x2": 243.0, "r_y2": 243.6, "r_x3": 239.3, "r_y3": 243.6, "coord_origin": "TOPLEFT" }, "text": "3", "orig": "3", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 65, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 271.3, "r_y0": 249.7, "r_x1": 275.0, "r_y1": 249.7, "r_x2": 275.0, "r_y2": 243.5, "r_x3": 271.3, "r_y3": 243.5, "coord_origin": "TOPLEFT" }, "text": "4", "orig": "4", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 66, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 229.8, "r_y0": 172.7, "r_x1": 233.5, "r_y1": 172.7, "r_x2": 233.5, "r_y2": 166.5, "r_x3": 229.8, "r_y3": 166.5, "coord_origin": "TOPLEFT" }, "text": "2", "orig": "2", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 67, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 257.2, "r_y0": 196.2, "r_x1": 260.9, "r_y1": 196.2, "r_x2": 260.9, "r_y2": 190.0, "r_x3": 257.2, "r_y3": 190.0, "coord_origin": "TOPLEFT" }, "text": "1", "orig": "1", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 68, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 186.9, "r_y0": 184.2, "r_x1": 190.6, "r_y1": 184.2, "r_x2": 190.6, "r_y2": 178.0, "r_x3": 186.9, "r_y3": 178.0, "coord_origin": "TOPLEFT" }, "text": "3", "orig": "3", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 69, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 196.5, "r_y0": 175.2, "r_x1": 200.2, "r_y1": 175.2, "r_x2": 200.2, "r_y2": 169.0, "r_x3": 196.5, "r_y3": 169.0, "coord_origin": "TOPLEFT" }, "text": "4", "orig": "4", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 70, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 169.7, "r_y0": 175.7, "r_x1": 175.7, "r_y1": 175.7, "r_x2": 175.7, "r_y2": 167.9, "r_x3": 169.7, "r_y3": 167.9, "coord_origin": "TOPLEFT" }, "text": "A", "orig": "A", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 71, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 169.7, "r_y0": 214.6, "r_x1": 175.7, "r_y1": 214.6, "r_x2": 175.7, "r_y2": 206.8, "r_x3": 169.7, "r_y3": 206.8, "coord_origin": "TOPLEFT" }, "text": "B", "orig": "B", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 72, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 274.3, "r_y0": 176.0, "r_x1": 280.3, "r_y1": 176.0, "r_x2": 280.3, "r_y2": 168.3, "r_x3": 274.3, "r_y3": 168.3, "coord_origin": "TOPLEFT" }, "text": "C", "orig": "C", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 73, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 359.6, "r_y0": 176.0, "r_x1": 365.5, "r_y1": 176.0, "r_x2": 365.5, "r_y2": 168.3, "r_x3": 359.6, "r_y3": 168.3, "coord_origin": "TOPLEFT" }, "text": "D", "orig": "D", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 74, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 169.7, "r_y0": 251.0, "r_x1": 175.3, "r_y1": 251.0, "r_x2": 175.3, "r_y2": 243.2, "r_x3": 169.7, "r_y3": 243.2, "coord_origin": "TOPLEFT" }, "text": "E", "orig": "E", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 75, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 134.8, "r_y0": 314.1, "r_x1": 149.4, "r_y1": 314.1, "r_x2": 149.4, "r_y2": 305.3, "r_x3": 134.8, "r_y3": 305.3, "coord_origin": "TOPLEFT" }, "text": "4.2", "orig": "4.2", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 76, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 160.9, "r_y0": 314.1, "r_x1": 246.7, "r_y1": 314.1, "r_x2": 246.7, "r_y2": 305.3, "r_x3": 160.9, "r_y3": 305.3, "coord_origin": "TOPLEFT" }, "text": "Language Syntax", "orig": "Language Syntax", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 77, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 134.8, "r_y0": 334.0, "r_x1": 363.8, "r_y1": 334.0, "r_x2": 363.8, "r_y2": 325.2, "r_x3": 134.8, "r_y3": 325.2, "coord_origin": "TOPLEFT" }, "text": "The OTSL representation follows these syntax rules:", "orig": "The OTSL representation follows these syntax rules:", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 78, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 139.0, "r_y0": 356.0, "r_x1": 146.7, "r_y1": 356.0, "r_x2": 146.7, "r_y2": 347.2, "r_x3": 139.0, "r_y3": 347.2, "coord_origin": "TOPLEFT" }, "text": "1.", "orig": "1.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 79, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 151.7, "r_y0": 356.0, "r_x1": 257.4, "r_y1": 356.0, "r_x2": 257.4, "r_y2": 347.2, "r_x3": 151.7, "r_y3": 347.2, "coord_origin": "TOPLEFT" }, "text": "Left-looking cell rule", "orig": "Left-looking cell rule", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 80, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 257.4, "r_y0": 356.0, "r_x1": 480.6, "r_y1": 356.0, "r_x2": 480.6, "r_y2": 347.2, "r_x3": 257.4, "r_y3": 347.2, "coord_origin": "TOPLEFT" }, "text": ": The left neighbour of an \"L\" cell must be either", "orig": ": The left neighbour of an \"L\" cell must be either", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 81, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 151.7, "r_y0": 367.9, "r_x1": 283.6, "r_y1": 367.9, "r_x2": 283.6, "r_y2": 359.1, "r_x3": 151.7, "r_y3": 359.1, "coord_origin": "TOPLEFT" }, "text": "another \"L\" cell or a \"C\" cell.", "orig": "another \"L\" cell or a \"C\" cell.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 82, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 139.0, "r_y0": 379.9, "r_x1": 146.7, "r_y1": 379.9, "r_x2": 146.7, "r_y2": 371.1, "r_x3": 139.0, "r_y3": 371.1, "coord_origin": "TOPLEFT" }, "text": "2.", "orig": "2.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 83, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 151.7, "r_y0": 379.9, "r_x1": 252.1, "r_y1": 379.9, "r_x2": 252.1, "r_y2": 371.1, "r_x3": 151.7, "r_y3": 371.1, "coord_origin": "TOPLEFT" }, "text": "Up-looking cell rule", "orig": "Up-looking cell rule", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 84, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 252.1, "r_y0": 379.9, "r_x1": 480.6, "r_y1": 379.9, "r_x2": 480.6, "r_y2": 371.1, "r_x3": 252.1, "r_y3": 371.1, "coord_origin": "TOPLEFT" }, "text": ": The upper neighbour of a \"U\" cell must be either", "orig": ": The upper neighbour of a \"U\" cell must be either", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 85, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 151.7, "r_y0": 391.8, "r_x1": 284.8, "r_y1": 391.8, "r_x2": 284.8, "r_y2": 383.0, "r_x3": 151.7, "r_y3": 383.0, "coord_origin": "TOPLEFT" }, "text": "another \"U\" cell or a \"C\" cell.", "orig": "another \"U\" cell or a \"C\" cell.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 86, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 139.0, "r_y0": 403.8, "r_x1": 146.7, "r_y1": 403.8, "r_x2": 146.7, "r_y2": 395.0, "r_x3": 139.0, "r_y3": 395.0, "coord_origin": "TOPLEFT" }, "text": "3.", "orig": "3.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 87, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 151.7, "r_y0": 403.8, "r_x1": 223.3, "r_y1": 403.8, "r_x2": 223.3, "r_y2": 395.0, "r_x3": 151.7, "r_y3": 395.0, "coord_origin": "TOPLEFT" }, "text": "Cross cell rule", "orig": "Cross cell rule", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 88, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 223.3, "r_y0": 403.8, "r_x1": 226.1, "r_y1": 403.8, "r_x2": 226.1, "r_y2": 395.0, "r_x3": 223.3, "r_y3": 395.0, "coord_origin": "TOPLEFT" }, "text": ":", "orig": ":", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 89, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 151.7, "r_y0": 415.8, "r_x1": 480.6, "r_y1": 415.8, "r_x2": 480.6, "r_y2": 407.0, "r_x3": 151.7, "r_y3": 407.0, "coord_origin": "TOPLEFT" }, "text": "The left neighbour of an \"X\" cell must be either another \"X\" cell or a \"U\"", "orig": "The left neighbour of an \"X\" cell must be either another \"X\" cell or a \"U\"", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 90, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 151.7, "r_y0": 427.7, "r_x1": 480.6, "r_y1": 427.7, "r_x2": 480.6, "r_y2": 418.9, "r_x3": 151.7, "r_y3": 418.9, "coord_origin": "TOPLEFT" }, "text": "cell, and the upper neighbour of an \"X\" cell must be either another \"X\" cell", "orig": "cell, and the upper neighbour of an \"X\" cell must be either another \"X\" cell", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 91, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 151.7, "r_y0": 439.7, "r_x1": 214.4, "r_y1": 439.7, "r_x2": 214.4, "r_y2": 430.9, "r_x3": 151.7, "r_y3": 430.9, "coord_origin": "TOPLEFT" }, "text": "or an \"L\" cell.", "orig": "or an \"L\" cell.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 92, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 139.0, "r_y0": 451.6, "r_x1": 146.7, "r_y1": 451.6, "r_x2": 146.7, "r_y2": 442.8, "r_x3": 139.0, "r_y3": 442.8, "coord_origin": "TOPLEFT" }, "text": "4.", "orig": "4.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 93, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 151.7, "r_y0": 451.6, "r_x1": 221.3, "r_y1": 451.6, "r_x2": 221.3, "r_y2": 442.8, "r_x3": 151.7, "r_y3": 442.8, "coord_origin": "TOPLEFT" }, "text": "First row rule", "orig": "First row rule", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 94, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 221.3, "r_y0": 451.6, "r_x1": 474.6, "r_y1": 451.6, "r_x2": 474.6, "r_y2": 442.8, "r_x3": 221.3, "r_y3": 442.8, "coord_origin": "TOPLEFT" }, "text": ": Only \"L\" cells and \"C\" cells are allowed in the first row.", "orig": ": Only \"L\" cells and \"C\" cells are allowed in the first row.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 95, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 139.0, "r_y0": 463.6, "r_x1": 146.7, "r_y1": 463.6, "r_x2": 146.7, "r_y2": 454.8, "r_x3": 139.0, "r_y3": 454.8, "coord_origin": "TOPLEFT" }, "text": "5.", "orig": "5.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 96, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 151.7, "r_y0": 463.6, "r_x1": 240.7, "r_y1": 463.6, "r_x2": 240.7, "r_y2": 454.8, "r_x3": 151.7, "r_y3": 454.8, "coord_origin": "TOPLEFT" }, "text": "First column rule", "orig": "First column rule", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 97, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 240.7, "r_y0": 463.6, "r_x1": 480.6, "r_y1": 463.6, "r_x2": 480.6, "r_y2": 454.8, "r_x3": 240.7, "r_y3": 454.8, "coord_origin": "TOPLEFT" }, "text": ": Only \"U\" cells and \"C\" cells are allowed in the first", "orig": ": Only \"U\" cells and \"C\" cells are allowed in the first", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 98, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 151.7, "r_y0": 475.5, "r_x1": 186.0, "r_y1": 475.5, "r_x2": 186.0, "r_y2": 466.7, "r_x3": 151.7, "r_y3": 466.7, "coord_origin": "TOPLEFT" }, "text": "column.", "orig": "column.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 99, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 139.0, "r_y0": 487.5, "r_x1": 146.7, "r_y1": 487.5, "r_x2": 146.7, "r_y2": 478.7, "r_x3": 139.0, "r_y3": 478.7, "coord_origin": "TOPLEFT" }, "text": "6.", "orig": "6.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 100, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 151.7, "r_y0": 487.5, "r_x1": 235.2, "r_y1": 487.5, "r_x2": 235.2, "r_y2": 478.7, "r_x3": 151.7, "r_y3": 478.7, "coord_origin": "TOPLEFT" }, "text": "Rectangular rule", "orig": "Rectangular rule", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 101, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 235.2, "r_y0": 487.5, "r_x1": 480.6, "r_y1": 487.5, "r_x2": 480.6, "r_y2": 478.7, "r_x3": 235.2, "r_y3": 478.7, "coord_origin": "TOPLEFT" }, "text": ": The table representation is always rectangular - all rows", "orig": ": The table representation is always rectangular - all rows", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 102, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 151.7, "r_y0": 499.5, "r_x1": 448.0, "r_y1": 499.5, "r_x2": 448.0, "r_y2": 490.7, "r_x3": 151.7, "r_y3": 490.7, "coord_origin": "TOPLEFT" }, "text": "must have an equal number of tokens, terminated with \"NL\" token.", "orig": "must have an equal number of tokens, terminated with \"NL\" token.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 103, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 149.7, "r_y0": 521.4, "r_x1": 480.6, "r_y1": 521.4, "r_x2": 480.6, "r_y2": 512.6, "r_x3": 149.7, "r_y3": 512.6, "coord_origin": "TOPLEFT" }, "text": "The application of these rules gives OTSL a set of unique properties. First", "orig": "The application of these rules gives OTSL a set of unique properties. First", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 104, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 134.8, "r_y0": 533.3, "r_x1": 480.6, "r_y1": 533.3, "r_x2": 480.6, "r_y2": 524.5, "r_x3": 134.8, "r_y3": 524.5, "coord_origin": "TOPLEFT" }, "text": "of all, the OTSL enforces a strictly rectangular structure representation, where", "orig": "of all, the OTSL enforces a strictly rectangular structure representation, where", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 105, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 134.8, "r_y0": 545.3, "r_x1": 480.6, "r_y1": 545.3, "r_x2": 480.6, "r_y2": 536.5, "r_x3": 134.8, "r_y3": 536.5, "coord_origin": "TOPLEFT" }, "text": "every new-line token starts a new row. As a consequence, all rows and all columns", "orig": "every new-line token starts a new row. As a consequence, all rows and all columns", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 106, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 134.8, "r_y0": 557.3, "r_x1": 480.6, "r_y1": 557.3, "r_x2": 480.6, "r_y2": 548.5, "r_x3": 134.8, "r_y3": 548.5, "coord_origin": "TOPLEFT" }, "text": "have exactly the same number of tokens, irrespective of cell spans. Secondly, the", "orig": "have exactly the same number of tokens, irrespective of cell spans. Secondly, the", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 107, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 134.8, "r_y0": 569.2, "r_x1": 480.6, "r_y1": 569.2, "r_x2": 480.6, "r_y2": 560.4, "r_x3": 134.8, "r_y3": 560.4, "coord_origin": "TOPLEFT" }, "text": "OTSL representation is unambiguous: Every table structure is represented in one", "orig": "OTSL representation is unambiguous: Every table structure is represented in one", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 108, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 134.8, "r_y0": 581.2, "r_x1": 480.6, "r_y1": 581.2, "r_x2": 480.6, "r_y2": 572.4, "r_x3": 134.8, "r_y3": 572.4, "coord_origin": "TOPLEFT" }, "text": "way. In this representation every table cell corresponds to a \"C\"-cell token, which", "orig": "way. In this representation every table cell corresponds to a \"C\"-cell token, which", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 109, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 134.8, "r_y0": 593.1, "r_x1": 480.6, "r_y1": 593.1, "r_x2": 480.6, "r_y2": 584.3, "r_x3": 134.8, "r_y3": 584.3, "coord_origin": "TOPLEFT" }, "text": "in case of spans is always located in the top-left corner of the table cell definition.", "orig": "in case of spans is always located in the top-left corner of the table cell definition.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 110, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 134.8, "r_y0": 605.1, "r_x1": 480.6, "r_y1": 605.1, "r_x2": 480.6, "r_y2": 596.3, "r_x3": 134.8, "r_y3": 596.3, "coord_origin": "TOPLEFT" }, "text": "Third, OTSL syntax rules are only backward-looking. As a consequence, every", "orig": "Third, OTSL syntax rules are only backward-looking. As a consequence, every", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 111, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 134.8, "r_y0": 617.0, "r_x1": 480.6, "r_y1": 617.0, "r_x2": 480.6, "r_y2": 608.2, "r_x3": 134.8, "r_y3": 608.2, "coord_origin": "TOPLEFT" }, "text": "predicted token can be validated straight during sequence generation by looking", "orig": "predicted token can be validated straight during sequence generation by looking", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 112, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 134.8, "r_y0": 629.0, "r_x1": 480.6, "r_y1": 629.0, "r_x2": 480.6, "r_y2": 620.2, "r_x3": 134.8, "r_y3": 620.2, "coord_origin": "TOPLEFT" }, "text": "at the previously predicted sequence. As such, OTSL can guarantee that every", "orig": "at the previously predicted sequence. As such, OTSL can guarantee that every", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 113, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 134.8, "r_y0": 640.9, "r_x1": 311.2, "r_y1": 640.9, "r_x2": 311.2, "r_y2": 632.1, "r_x3": 134.8, "r_y3": 632.1, "coord_origin": "TOPLEFT" }, "text": "predicted sequence is syntactically valid.", "orig": "predicted sequence is syntactically valid.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 114, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 149.7, "r_y0": 652.9, "r_x1": 480.6, "r_y1": 652.9, "r_x2": 480.6, "r_y2": 644.1, "r_x3": 149.7, "r_y3": 644.1, "coord_origin": "TOPLEFT" }, "text": "These characteristics can be easily learned by sequence generator networks,", "orig": "These characteristics can be easily learned by sequence generator networks,", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 115, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 134.8, "r_y0": 664.9, "r_x1": 480.6, "r_y1": 664.9, "r_x2": 480.6, "r_y2": 656.1, "r_x3": 134.8, "r_y3": 656.1, "coord_origin": "TOPLEFT" }, "text": "as we demonstrate further below. We find strong indications that this pattern", "orig": "as we demonstrate further below. We find strong indications that this pattern", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "has_chars": false, "has_words": false, "has_lines": true, "image": null, "lines": [] }, "predictions": { "layout": { "clusters": [ { "id": 7, "label": "page_header", "bbox": { "l": 194.5, "t": 93.8, "r": 447.5, "b": 101.8, "coord_origin": "TOPLEFT" }, "confidence": 0.93, "cells": [ { "index": 0, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 194.5, "r_y0": 101.8, "r_x1": 447.5, "r_y1": 101.8, "r_x2": 447.5, "r_y2": 93.8, "r_x3": 194.5, "r_y3": 93.8, "coord_origin": "TOPLEFT" }, "text": "Optimized Table Tokenization for Table Structure Recognition", "orig": "Optimized Table Tokenization for Table Structure Recognition", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 11, "label": "page_header", "bbox": { "l": 476.0, "t": 93.8, "r": 480.6, "b": 101.8, "coord_origin": "TOPLEFT" }, "confidence": 0.87, "cells": [ { "index": 1, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 476.0, "r_y0": 101.8, "r_x1": 480.6, "r_y1": 101.8, "r_x2": 480.6, "r_y2": 93.8, "r_x3": 476.0, "r_y3": 93.8, "coord_origin": "TOPLEFT" }, "text": "7", "orig": "7", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 6, "label": "caption", "bbox": { "l": 134.8, "t": 125.8, "r": 480.6, "b": 155.8, "coord_origin": "TOPLEFT" }, "confidence": 0.93, "cells": [ { "index": 2, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 134.8, "r_y0": 133.7, "r_x1": 162.6, "r_y1": 133.7, "r_x2": 162.6, "r_y2": 125.8, "r_x3": 134.8, "r_y3": 125.8, "coord_origin": "TOPLEFT" }, "text": "Fig. 3.", "orig": "Fig. 3.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 3, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 166.3, "r_y0": 133.9, "r_x1": 480.6, "r_y1": 133.9, "r_x2": 480.6, "r_y2": 125.9, "r_x3": 166.3, "r_y3": 125.9, "coord_origin": "TOPLEFT" }, "text": "OTSL description of table structure: A - table example; B - graphical repre-", "orig": "OTSL description of table structure: A - table example; B - graphical repre-", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 4, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 134.8, "r_y0": 144.9, "r_x1": 480.6, "r_y1": 144.9, "r_x2": 480.6, "r_y2": 136.8, "r_x3": 134.8, "r_y3": 136.8, "coord_origin": "TOPLEFT" }, "text": "sentation of table structure; C - mapping structure on a grid; D - OTSL structure", "orig": "sentation of table structure; C - mapping structure on a grid; D - OTSL structure", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 5, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 134.8, "r_y0": 155.8, "r_x1": 306.1, "r_y1": 155.8, "r_x2": 306.1, "r_y2": 147.8, "r_x3": 134.8, "r_y3": 147.8, "coord_origin": "TOPLEFT" }, "text": "encoding; E - explanation on cell encoding", "orig": "encoding; E - explanation on cell encoding", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 12, "label": "picture", "bbox": { "l": 164.7, "t": 163.8, "r": 449.6, "b": 280.3, "coord_origin": "TOPLEFT" }, "confidence": 0.79, "cells": [ { "index": 6, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 374.5, "r_y0": 177.9, "r_x1": 381.7, "r_y1": 177.9, "r_x2": 381.7, "r_y2": 168.6, "r_x3": 374.5, "r_y3": 168.6, "coord_origin": "TOPLEFT" }, "text": "C", "orig": "C", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 7, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 398.7, "r_y0": 177.8, "r_x1": 405.9, "r_y1": 177.8, "r_x2": 405.9, "r_y2": 168.5, "r_x3": 398.7, "r_y3": 168.5, "coord_origin": "TOPLEFT" }, "text": "C", "orig": "C", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 8, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 373.8, "r_y0": 202.2, "r_x1": 380.9, "r_y1": 202.2, "r_x2": 380.9, "r_y2": 192.9, "r_x3": 373.8, "r_y3": 192.9, "coord_origin": "TOPLEFT" }, "text": "C", "orig": "C", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 9, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 386.7, "r_y0": 202.4, "r_x1": 393.8, "r_y1": 202.4, "r_x2": 393.8, "r_y2": 193.1, "r_x3": 386.7, "r_y3": 193.1, "coord_origin": "TOPLEFT" }, "text": "C", "orig": "C", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 10, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 386.7, "r_y0": 214.5, "r_x1": 393.9, "r_y1": 214.5, "r_x2": 393.9, "r_y2": 205.1, "r_x3": 386.7, "r_y3": 205.1, "coord_origin": "TOPLEFT" }, "text": "C", "orig": "C", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 11, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 398.7, "r_y0": 190.1, "r_x1": 405.8, "r_y1": 190.1, "r_x2": 405.8, "r_y2": 180.7, "r_x3": 398.7, "r_y3": 180.7, "coord_origin": "TOPLEFT" }, "text": "C", "orig": "C", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 12, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 410.8, "r_y0": 190.1, "r_x1": 418.0, "r_y1": 190.1, "r_x2": 418.0, "r_y2": 180.7, "r_x3": 410.8, "r_y3": 180.7, "coord_origin": "TOPLEFT" }, "text": "C", "orig": "C", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 13, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 422.9, "r_y0": 190.0, "r_x1": 430.1, "r_y1": 190.0, "r_x2": 430.1, "r_y2": 180.7, "r_x3": 422.9, "r_y3": 180.7, "coord_origin": "TOPLEFT" }, "text": "C", "orig": "C", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 14, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 398.8, "r_y0": 202.3, "r_x1": 406.0, "r_y1": 202.3, "r_x2": 406.0, "r_y2": 193.0, "r_x3": 398.8, "r_y3": 193.0, "coord_origin": "TOPLEFT" }, "text": "C", "orig": "C", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 15, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 410.9, "r_y0": 202.3, "r_x1": 418.1, "r_y1": 202.3, "r_x2": 418.1, "r_y2": 193.0, "r_x3": 410.9, "r_y3": 193.0, "coord_origin": "TOPLEFT" }, "text": "C", "orig": "C", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 16, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 423.0, "r_y0": 202.2, "r_x1": 430.2, "r_y1": 202.2, "r_x2": 430.2, "r_y2": 192.9, "r_x3": 423.0, "r_y3": 192.9, "coord_origin": "TOPLEFT" }, "text": "C", "orig": "C", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 17, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 398.8, "r_y0": 214.6, "r_x1": 406.0, "r_y1": 214.6, "r_x2": 406.0, "r_y2": 205.3, "r_x3": 398.8, "r_y3": 205.3, "coord_origin": "TOPLEFT" }, "text": "C", "orig": "C", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 18, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 410.9, "r_y0": 214.6, "r_x1": 418.1, "r_y1": 214.6, "r_x2": 418.1, "r_y2": 205.3, "r_x3": 410.9, "r_y3": 205.3, "coord_origin": "TOPLEFT" }, "text": "C", "orig": "C", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 19, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 423.0, "r_y0": 214.6, "r_x1": 430.2, "r_y1": 214.6, "r_x2": 430.2, "r_y2": 205.2, "r_x3": 423.0, "r_y3": 205.2, "coord_origin": "TOPLEFT" }, "text": "C", "orig": "C", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 20, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 386.5, "r_y0": 226.4, "r_x1": 393.7, "r_y1": 226.4, "r_x2": 393.7, "r_y2": 217.0, "r_x3": 386.5, "r_y3": 217.0, "coord_origin": "TOPLEFT" }, "text": "C", "orig": "C", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 21, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 398.6, "r_y0": 226.5, "r_x1": 405.8, "r_y1": 226.5, "r_x2": 405.8, "r_y2": 217.2, "r_x3": 398.6, "r_y3": 217.2, "coord_origin": "TOPLEFT" }, "text": "C", "orig": "C", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 22, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 410.7, "r_y0": 226.5, "r_x1": 417.9, "r_y1": 226.5, "r_x2": 417.9, "r_y2": 217.2, "r_x3": 410.7, "r_y3": 217.2, "coord_origin": "TOPLEFT" }, "text": "C", "orig": "C", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 23, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 422.8, "r_y0": 226.5, "r_x1": 430.0, "r_y1": 226.5, "r_x2": 430.0, "r_y2": 217.1, "r_x3": 422.8, "r_y3": 217.1, "coord_origin": "TOPLEFT" }, "text": "C", "orig": "C", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 24, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 435.2, "r_y0": 177.0, "r_x1": 447.9, "r_y1": 177.0, "r_x2": 447.9, "r_y2": 167.7, "r_x3": 435.2, "r_y3": 167.7, "coord_origin": "TOPLEFT" }, "text": "NL", "orig": "NL", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 25, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 435.4, "r_y0": 189.5, "r_x1": 448.1, "r_y1": 189.5, "r_x2": 448.1, "r_y2": 180.2, "r_x3": 435.4, "r_y3": 180.2, "coord_origin": "TOPLEFT" }, "text": "NL", "orig": "NL", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 26, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 435.5, "r_y0": 201.8, "r_x1": 448.2, "r_y1": 201.8, "r_x2": 448.2, "r_y2": 192.5, "r_x3": 435.5, "r_y3": 192.5, "coord_origin": "TOPLEFT" }, "text": "NL", "orig": "NL", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 27, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 435.4, "r_y0": 214.2, "r_x1": 448.1, "r_y1": 214.2, "r_x2": 448.1, "r_y2": 204.8, "r_x3": 435.4, "r_y3": 204.8, "coord_origin": "TOPLEFT" }, "text": "NL", "orig": "NL", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 28, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 435.6, "r_y0": 226.6, "r_x1": 448.3, "r_y1": 226.6, "r_x2": 448.3, "r_y2": 217.2, "r_x3": 435.6, "r_y3": 217.2, "coord_origin": "TOPLEFT" }, "text": "NL", "orig": "NL", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 29, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 374.1, "r_y0": 214.6, "r_x1": 381.3, "r_y1": 214.6, "r_x2": 381.3, "r_y2": 205.2, "r_x3": 374.1, "r_y3": 205.2, "coord_origin": "TOPLEFT" }, "text": "U", "orig": "U", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 30, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 374.0, "r_y0": 226.5, "r_x1": 381.2, "r_y1": 226.5, "r_x2": 381.2, "r_y2": 217.1, "r_x3": 374.0, "r_y3": 217.1, "coord_origin": "TOPLEFT" }, "text": "U", "orig": "U", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 31, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 374.3, "r_y0": 190.3, "r_x1": 381.5, "r_y1": 190.3, "r_x2": 381.5, "r_y2": 180.9, "r_x3": 374.3, "r_y3": 180.9, "coord_origin": "TOPLEFT" }, "text": "U", "orig": "U", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 32, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 387.8, "r_y0": 177.9, "r_x1": 393.3, "r_y1": 177.9, "r_x2": 393.3, "r_y2": 168.6, "r_x3": 387.8, "r_y3": 168.6, "coord_origin": "TOPLEFT" }, "text": "L", "orig": "L", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 33, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 411.9, "r_y0": 177.4, "r_x1": 417.4, "r_y1": 177.4, "r_x2": 417.4, "r_y2": 168.1, "r_x3": 411.9, "r_y3": 168.1, "coord_origin": "TOPLEFT" }, "text": "L", "orig": "L", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 34, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 423.3, "r_y0": 177.3, "r_x1": 428.9, "r_y1": 177.3, "r_x2": 428.9, "r_y2": 167.9, "r_x3": 423.3, "r_y3": 167.9, "coord_origin": "TOPLEFT" }, "text": "L", "orig": "L", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 35, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 387.1, "r_y0": 190.1, "r_x1": 393.8, "r_y1": 190.1, "r_x2": 393.8, "r_y2": 180.8, "r_x3": 387.1, "r_y3": 180.8, "coord_origin": "TOPLEFT" }, "text": "X", "orig": "X", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 36, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 282.3, "r_y0": 253.8, "r_x1": 289.4, "r_y1": 253.8, "r_x2": 289.4, "r_y2": 244.5, "r_x3": 282.3, "r_y3": 244.5, "coord_origin": "TOPLEFT" }, "text": "C", "orig": "C", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 37, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 282.1, "r_y0": 266.2, "r_x1": 289.3, "r_y1": 266.2, "r_x2": 289.3, "r_y2": 256.9, "r_x3": 282.1, "r_y3": 256.9, "coord_origin": "TOPLEFT" }, "text": "U", "orig": "U", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 38, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 282.4, "r_y0": 278.5, "r_x1": 289.6, "r_y1": 278.5, "r_x2": 289.6, "r_y2": 269.1, "r_x3": 282.4, "r_y3": 269.1, "coord_origin": "TOPLEFT" }, "text": "U", "orig": "U", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 39, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 295.5, "r_y0": 253.8, "r_x1": 301.1, "r_y1": 253.8, "r_x2": 301.1, "r_y2": 244.5, "r_x3": 295.5, "r_y3": 244.5, "coord_origin": "TOPLEFT" }, "text": "L", "orig": "L", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 40, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 307.5, "r_y0": 253.9, "r_x1": 313.0, "r_y1": 253.9, "r_x2": 313.0, "r_y2": 244.6, "r_x3": 307.5, "r_y3": 244.6, "coord_origin": "TOPLEFT" }, "text": "L", "orig": "L", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 41, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 318.8, "r_y0": 253.8, "r_x1": 324.3, "r_y1": 253.8, "r_x2": 324.3, "r_y2": 244.4, "r_x3": 318.8, "r_y3": 244.4, "coord_origin": "TOPLEFT" }, "text": "L", "orig": "L", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 42, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 294.9, "r_y0": 266.0, "r_x1": 301.0, "r_y1": 266.0, "r_x2": 301.0, "r_y2": 256.7, "r_x3": 294.9, "r_y3": 256.7, "coord_origin": "TOPLEFT" }, "text": "X", "orig": "X", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 43, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 307.2, "r_y0": 266.0, "r_x1": 325.6, "r_y1": 266.0, "r_x2": 325.6, "r_y2": 256.7, "r_x3": 307.2, "r_y3": 256.7, "coord_origin": "TOPLEFT" }, "text": "X X", "orig": "X X", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 44, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 294.8, "r_y0": 278.6, "r_x1": 300.9, "r_y1": 278.6, "r_x2": 300.9, "r_y2": 269.3, "r_x3": 294.8, "r_y3": 269.3, "coord_origin": "TOPLEFT" }, "text": "X", "orig": "X", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 45, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 307.1, "r_y0": 278.6, "r_x1": 325.5, "r_y1": 278.6, "r_x2": 325.5, "r_y2": 269.3, "r_x3": 307.1, "r_y3": 269.3, "coord_origin": "TOPLEFT" }, "text": "X X", "orig": "X X", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 46, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 195.9, "r_y0": 278.1, "r_x1": 203.1, "r_y1": 278.1, "r_x2": 203.1, "r_y2": 268.7, "r_x3": 195.9, "r_y3": 268.7, "coord_origin": "TOPLEFT" }, "text": "C", "orig": "C", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 47, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 209.2, "r_y0": 278.1, "r_x1": 214.7, "r_y1": 278.1, "r_x2": 214.7, "r_y2": 268.7, "r_x3": 209.2, "r_y3": 268.7, "coord_origin": "TOPLEFT" }, "text": "L", "orig": "L", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 48, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 221.1, "r_y0": 278.1, "r_x1": 226.7, "r_y1": 278.1, "r_x2": 226.7, "r_y2": 268.8, "r_x3": 221.1, "r_y3": 268.8, "coord_origin": "TOPLEFT" }, "text": "L", "orig": "L", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 49, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 232.4, "r_y0": 278.0, "r_x1": 238.0, "r_y1": 278.0, "r_x2": 238.0, "r_y2": 268.7, "r_x3": 232.4, "r_y3": 268.7, "coord_origin": "TOPLEFT" }, "text": "L", "orig": "L", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 50, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 196.2, "r_y0": 253.9, "r_x1": 203.4, "r_y1": 253.9, "r_x2": 203.4, "r_y2": 244.5, "r_x3": 196.2, "r_y3": 244.5, "coord_origin": "TOPLEFT" }, "text": "C", "orig": "C", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 51, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 250.3, "r_y0": 253.4, "r_x1": 257.5, "r_y1": 253.4, "r_x2": 257.5, "r_y2": 244.1, "r_x3": 250.3, "r_y3": 244.1, "coord_origin": "TOPLEFT" }, "text": "C", "orig": "C", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 52, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 250.2, "r_y0": 265.8, "r_x1": 257.3, "r_y1": 265.8, "r_x2": 257.3, "r_y2": 256.4, "r_x3": 250.2, "r_y3": 256.4, "coord_origin": "TOPLEFT" }, "text": "U", "orig": "U", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 53, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 250.5, "r_y0": 278.0, "r_x1": 257.6, "r_y1": 278.0, "r_x2": 257.6, "r_y2": 268.7, "r_x3": 250.5, "r_y3": 268.7, "coord_origin": "TOPLEFT" }, "text": "U", "orig": "U", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 54, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 334.5, "r_y0": 249.2, "r_x1": 337.2, "r_y1": 249.2, "r_x2": 337.2, "r_y2": 243.0, "r_x3": 334.5, "r_y3": 243.0, "coord_origin": "TOPLEFT" }, "text": "1", "orig": "1", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 55, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 339.9, "r_y0": 249.2, "r_x1": 391.5, "r_y1": 249.2, "r_x2": 391.5, "r_y2": 243.0, "r_x3": 339.9, "r_y3": 243.0, "coord_origin": "TOPLEFT" }, "text": "- simple cells: \"C\"", "orig": "- simple cells: \"C\"", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 56, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 334.5, "r_y0": 259.1, "r_x1": 337.3, "r_y1": 259.1, "r_x2": 337.3, "r_y2": 252.9, "r_x3": 334.5, "r_y3": 252.9, "coord_origin": "TOPLEFT" }, "text": "2", "orig": "2", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 57, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 340.2, "r_y0": 259.1, "r_x1": 422.0, "r_y1": 259.1, "r_x2": 422.0, "r_y2": 252.9, "r_x3": 340.2, "r_y3": 252.9, "coord_origin": "TOPLEFT" }, "text": "- horizontal merges: \"C\", \"L\"", "orig": "- horizontal merges: \"C\", \"L\"", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 58, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 334.5, "r_y0": 269.1, "r_x1": 337.3, "r_y1": 269.1, "r_x2": 337.3, "r_y2": 262.9, "r_x3": 334.5, "r_y3": 262.9, "coord_origin": "TOPLEFT" }, "text": "3", "orig": "3", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 59, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 340.1, "r_y0": 269.1, "r_x1": 415.3, "r_y1": 269.1, "r_x2": 415.3, "r_y2": 262.9, "r_x3": 340.1, "r_y3": 262.9, "coord_origin": "TOPLEFT" }, "text": "- vertical merges: \"C\", \"U\"", "orig": "- vertical merges: \"C\", \"U\"", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 60, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 334.5, "r_y0": 279.0, "r_x1": 337.3, "r_y1": 279.0, "r_x2": 337.3, "r_y2": 272.8, "r_x3": 334.5, "r_y3": 272.8, "coord_origin": "TOPLEFT" }, "text": "4", "orig": "4", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 61, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 340.1, "r_y0": 279.0, "r_x1": 426.6, "r_y1": 279.0, "r_x2": 426.6, "r_y2": 272.8, "r_x3": 340.1, "r_y3": 272.8, "coord_origin": "TOPLEFT" }, "text": "- 2d merges: \"C\", \"L\", \"U\", \"X\"", "orig": "- 2d merges: \"C\", \"L\", \"U\", \"X\"", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 62, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 185.7, "r_y0": 250.3, "r_x1": 189.4, "r_y1": 250.3, "r_x2": 189.4, "r_y2": 244.0, "r_x3": 185.7, "r_y3": 244.0, "coord_origin": "TOPLEFT" }, "text": "1", "orig": "1", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 63, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 186.0, "r_y0": 274.6, "r_x1": 189.7, "r_y1": 274.6, "r_x2": 189.7, "r_y2": 268.3, "r_x3": 186.0, "r_y3": 268.3, "coord_origin": "TOPLEFT" }, "text": "2", "orig": "2", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 64, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 239.3, "r_y0": 249.8, "r_x1": 243.0, "r_y1": 249.8, "r_x2": 243.0, "r_y2": 243.6, "r_x3": 239.3, "r_y3": 243.6, "coord_origin": "TOPLEFT" }, "text": "3", "orig": "3", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 65, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 271.3, "r_y0": 249.7, "r_x1": 275.0, "r_y1": 249.7, "r_x2": 275.0, "r_y2": 243.5, "r_x3": 271.3, "r_y3": 243.5, "coord_origin": "TOPLEFT" }, "text": "4", "orig": "4", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 66, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 229.8, "r_y0": 172.7, "r_x1": 233.5, "r_y1": 172.7, "r_x2": 233.5, "r_y2": 166.5, "r_x3": 229.8, "r_y3": 166.5, "coord_origin": "TOPLEFT" }, "text": "2", "orig": "2", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 67, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 257.2, "r_y0": 196.2, "r_x1": 260.9, "r_y1": 196.2, "r_x2": 260.9, "r_y2": 190.0, "r_x3": 257.2, "r_y3": 190.0, "coord_origin": "TOPLEFT" }, "text": "1", "orig": "1", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 68, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 186.9, "r_y0": 184.2, "r_x1": 190.6, "r_y1": 184.2, "r_x2": 190.6, "r_y2": 178.0, "r_x3": 186.9, "r_y3": 178.0, "coord_origin": "TOPLEFT" }, "text": "3", "orig": "3", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 69, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 196.5, "r_y0": 175.2, "r_x1": 200.2, "r_y1": 175.2, "r_x2": 200.2, "r_y2": 169.0, "r_x3": 196.5, "r_y3": 169.0, "coord_origin": "TOPLEFT" }, "text": "4", "orig": "4", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 70, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 169.7, "r_y0": 175.7, "r_x1": 175.7, "r_y1": 175.7, "r_x2": 175.7, "r_y2": 167.9, "r_x3": 169.7, "r_y3": 167.9, "coord_origin": "TOPLEFT" }, "text": "A", "orig": "A", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 71, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 169.7, "r_y0": 214.6, "r_x1": 175.7, "r_y1": 214.6, "r_x2": 175.7, "r_y2": 206.8, "r_x3": 169.7, "r_y3": 206.8, "coord_origin": "TOPLEFT" }, "text": "B", "orig": "B", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 72, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 274.3, "r_y0": 176.0, "r_x1": 280.3, "r_y1": 176.0, "r_x2": 280.3, "r_y2": 168.3, "r_x3": 274.3, "r_y3": 168.3, "coord_origin": "TOPLEFT" }, "text": "C", "orig": "C", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 73, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 359.6, "r_y0": 176.0, "r_x1": 365.5, "r_y1": 176.0, "r_x2": 365.5, "r_y2": 168.3, "r_x3": 359.6, "r_y3": 168.3, "coord_origin": "TOPLEFT" }, "text": "D", "orig": "D", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 74, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 169.7, "r_y0": 251.0, "r_x1": 175.3, "r_y1": 251.0, "r_x2": 175.3, "r_y2": 243.2, "r_x3": 169.7, "r_y3": 243.2, "coord_origin": "TOPLEFT" }, "text": "E", "orig": "E", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [ { "id": 38, "label": "text", "bbox": { "l": 374.5, "t": 168.6, "r": 381.7, "b": 177.9, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 6, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 374.5, "r_y0": 177.9, "r_x1": 381.7, "r_y1": 177.9, "r_x2": 381.7, "r_y2": 168.6, "r_x3": 374.5, "r_y3": 168.6, "coord_origin": "TOPLEFT" }, "text": "C", "orig": "C", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 39, "label": "text", "bbox": { "l": 398.7, "t": 168.5, "r": 405.9, "b": 177.8, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 7, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 398.7, "r_y0": 177.8, "r_x1": 405.9, "r_y1": 177.8, "r_x2": 405.9, "r_y2": 168.5, "r_x3": 398.7, "r_y3": 168.5, "coord_origin": "TOPLEFT" }, "text": "C", "orig": "C", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 40, "label": "text", "bbox": { "l": 373.8, "t": 192.9, "r": 380.9, "b": 202.2, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 8, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 373.8, "r_y0": 202.2, "r_x1": 380.9, "r_y1": 202.2, "r_x2": 380.9, "r_y2": 192.9, "r_x3": 373.8, "r_y3": 192.9, "coord_origin": "TOPLEFT" }, "text": "C", "orig": "C", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 41, "label": "text", "bbox": { "l": 386.7, "t": 193.1, "r": 393.8, "b": 202.4, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 9, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 386.7, "r_y0": 202.4, "r_x1": 393.8, "r_y1": 202.4, "r_x2": 393.8, "r_y2": 193.1, "r_x3": 386.7, "r_y3": 193.1, "coord_origin": "TOPLEFT" }, "text": "C", "orig": "C", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 42, "label": "text", "bbox": { "l": 386.7, "t": 205.1, "r": 393.9, "b": 214.5, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 10, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 386.7, "r_y0": 214.5, "r_x1": 393.9, "r_y1": 214.5, "r_x2": 393.9, "r_y2": 205.1, "r_x3": 386.7, "r_y3": 205.1, "coord_origin": "TOPLEFT" }, "text": "C", "orig": "C", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 43, "label": "text", "bbox": { "l": 398.7, "t": 180.7, "r": 405.8, "b": 190.1, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 11, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 398.7, "r_y0": 190.1, "r_x1": 405.8, "r_y1": 190.1, "r_x2": 405.8, "r_y2": 180.7, "r_x3": 398.7, "r_y3": 180.7, "coord_origin": "TOPLEFT" }, "text": "C", "orig": "C", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 44, "label": "text", "bbox": { "l": 410.8, "t": 180.7, "r": 418.0, "b": 190.1, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 12, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 410.8, "r_y0": 190.1, "r_x1": 418.0, "r_y1": 190.1, "r_x2": 418.0, "r_y2": 180.7, "r_x3": 410.8, "r_y3": 180.7, "coord_origin": "TOPLEFT" }, "text": "C", "orig": "C", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 45, "label": "text", "bbox": { "l": 422.9, "t": 180.7, "r": 430.1, "b": 190.0, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 13, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 422.9, "r_y0": 190.0, "r_x1": 430.1, "r_y1": 190.0, "r_x2": 430.1, "r_y2": 180.7, "r_x3": 422.9, "r_y3": 180.7, "coord_origin": "TOPLEFT" }, "text": "C", "orig": "C", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 46, "label": "text", "bbox": { "l": 398.8, "t": 193.0, "r": 406.0, "b": 202.3, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 14, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 398.8, "r_y0": 202.3, "r_x1": 406.0, "r_y1": 202.3, "r_x2": 406.0, "r_y2": 193.0, "r_x3": 398.8, "r_y3": 193.0, "coord_origin": "TOPLEFT" }, "text": "C", "orig": "C", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 47, "label": "text", "bbox": { "l": 410.9, "t": 193.0, "r": 418.1, "b": 202.3, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 15, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 410.9, "r_y0": 202.3, "r_x1": 418.1, "r_y1": 202.3, "r_x2": 418.1, "r_y2": 193.0, "r_x3": 410.9, "r_y3": 193.0, "coord_origin": "TOPLEFT" }, "text": "C", "orig": "C", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 48, "label": "text", "bbox": { "l": 423.0, "t": 192.9, "r": 430.2, "b": 202.2, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 16, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 423.0, "r_y0": 202.2, "r_x1": 430.2, "r_y1": 202.2, "r_x2": 430.2, "r_y2": 192.9, "r_x3": 423.0, "r_y3": 192.9, "coord_origin": "TOPLEFT" }, "text": "C", "orig": "C", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 49, "label": "text", "bbox": { "l": 398.8, "t": 205.3, "r": 406.0, "b": 214.6, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 17, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 398.8, "r_y0": 214.6, "r_x1": 406.0, "r_y1": 214.6, "r_x2": 406.0, "r_y2": 205.3, "r_x3": 398.8, "r_y3": 205.3, "coord_origin": "TOPLEFT" }, "text": "C", "orig": "C", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 50, "label": "text", "bbox": { "l": 410.9, "t": 205.3, "r": 418.1, "b": 214.6, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 18, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 410.9, "r_y0": 214.6, "r_x1": 418.1, "r_y1": 214.6, "r_x2": 418.1, "r_y2": 205.3, "r_x3": 410.9, "r_y3": 205.3, "coord_origin": "TOPLEFT" }, "text": "C", "orig": "C", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 51, "label": "text", "bbox": { "l": 423.0, "t": 205.2, "r": 430.2, "b": 214.6, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 19, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 423.0, "r_y0": 214.6, "r_x1": 430.2, "r_y1": 214.6, "r_x2": 430.2, "r_y2": 205.2, "r_x3": 423.0, "r_y3": 205.2, "coord_origin": "TOPLEFT" }, "text": "C", "orig": "C", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 52, "label": "text", "bbox": { "l": 386.5, "t": 217.0, "r": 393.7, "b": 226.4, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 20, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 386.5, "r_y0": 226.4, "r_x1": 393.7, "r_y1": 226.4, "r_x2": 393.7, "r_y2": 217.0, "r_x3": 386.5, "r_y3": 217.0, "coord_origin": "TOPLEFT" }, "text": "C", "orig": "C", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 53, "label": "text", "bbox": { "l": 398.6, "t": 217.2, "r": 405.8, "b": 226.5, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 21, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 398.6, "r_y0": 226.5, "r_x1": 405.8, "r_y1": 226.5, "r_x2": 405.8, "r_y2": 217.2, "r_x3": 398.6, "r_y3": 217.2, "coord_origin": "TOPLEFT" }, "text": "C", "orig": "C", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 54, "label": "text", "bbox": { "l": 410.7, "t": 217.2, "r": 417.9, "b": 226.5, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 22, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 410.7, "r_y0": 226.5, "r_x1": 417.9, "r_y1": 226.5, "r_x2": 417.9, "r_y2": 217.2, "r_x3": 410.7, "r_y3": 217.2, "coord_origin": "TOPLEFT" }, "text": "C", "orig": "C", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 55, "label": "text", "bbox": { "l": 422.8, "t": 217.1, "r": 430.0, "b": 226.5, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 23, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 422.8, "r_y0": 226.5, "r_x1": 430.0, "r_y1": 226.5, "r_x2": 430.0, "r_y2": 217.1, "r_x3": 422.8, "r_y3": 217.1, "coord_origin": "TOPLEFT" }, "text": "C", "orig": "C", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 56, "label": "text", "bbox": { "l": 435.2, "t": 167.7, "r": 447.9, "b": 177.0, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 24, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 435.2, "r_y0": 177.0, "r_x1": 447.9, "r_y1": 177.0, "r_x2": 447.9, "r_y2": 167.7, "r_x3": 435.2, "r_y3": 167.7, "coord_origin": "TOPLEFT" }, "text": "NL", "orig": "NL", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 57, "label": "text", "bbox": { "l": 435.4, "t": 180.2, "r": 448.1, "b": 189.5, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 25, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 435.4, "r_y0": 189.5, "r_x1": 448.1, "r_y1": 189.5, "r_x2": 448.1, "r_y2": 180.2, "r_x3": 435.4, "r_y3": 180.2, "coord_origin": "TOPLEFT" }, "text": "NL", "orig": "NL", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 58, "label": "text", "bbox": { "l": 435.5, "t": 192.5, "r": 448.2, "b": 201.8, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 26, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 435.5, "r_y0": 201.8, "r_x1": 448.2, "r_y1": 201.8, "r_x2": 448.2, "r_y2": 192.5, "r_x3": 435.5, "r_y3": 192.5, "coord_origin": "TOPLEFT" }, "text": "NL", "orig": "NL", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 59, "label": "text", "bbox": { "l": 435.4, "t": 204.8, "r": 448.1, "b": 214.2, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 27, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 435.4, "r_y0": 214.2, "r_x1": 448.1, "r_y1": 214.2, "r_x2": 448.1, "r_y2": 204.8, "r_x3": 435.4, "r_y3": 204.8, "coord_origin": "TOPLEFT" }, "text": "NL", "orig": "NL", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 60, "label": "text", "bbox": { "l": 435.6, "t": 217.2, "r": 448.3, "b": 226.6, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 28, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 435.6, "r_y0": 226.6, "r_x1": 448.3, "r_y1": 226.6, "r_x2": 448.3, "r_y2": 217.2, "r_x3": 435.6, "r_y3": 217.2, "coord_origin": "TOPLEFT" }, "text": "NL", "orig": "NL", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 61, "label": "text", "bbox": { "l": 374.1, "t": 205.2, "r": 381.3, "b": 214.6, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 29, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 374.1, "r_y0": 214.6, "r_x1": 381.3, "r_y1": 214.6, "r_x2": 381.3, "r_y2": 205.2, "r_x3": 374.1, "r_y3": 205.2, "coord_origin": "TOPLEFT" }, "text": "U", "orig": "U", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 62, "label": "text", "bbox": { "l": 374.0, "t": 217.1, "r": 381.2, "b": 226.5, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 30, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 374.0, "r_y0": 226.5, "r_x1": 381.2, "r_y1": 226.5, "r_x2": 381.2, "r_y2": 217.1, "r_x3": 374.0, "r_y3": 217.1, "coord_origin": "TOPLEFT" }, "text": "U", "orig": "U", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 63, "label": "text", "bbox": { "l": 374.3, "t": 180.9, "r": 381.5, "b": 190.3, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 31, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 374.3, "r_y0": 190.3, "r_x1": 381.5, "r_y1": 190.3, "r_x2": 381.5, "r_y2": 180.9, "r_x3": 374.3, "r_y3": 180.9, "coord_origin": "TOPLEFT" }, "text": "U", "orig": "U", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 64, "label": "text", "bbox": { "l": 387.8, "t": 168.6, "r": 393.3, "b": 177.9, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 32, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 387.8, "r_y0": 177.9, "r_x1": 393.3, "r_y1": 177.9, "r_x2": 393.3, "r_y2": 168.6, "r_x3": 387.8, "r_y3": 168.6, "coord_origin": "TOPLEFT" }, "text": "L", "orig": "L", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 65, "label": "text", "bbox": { "l": 411.9, "t": 168.1, "r": 417.4, "b": 177.4, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 33, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 411.9, "r_y0": 177.4, "r_x1": 417.4, "r_y1": 177.4, "r_x2": 417.4, "r_y2": 168.1, "r_x3": 411.9, "r_y3": 168.1, "coord_origin": "TOPLEFT" }, "text": "L", "orig": "L", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 66, "label": "text", "bbox": { "l": 423.3, "t": 167.9, "r": 428.9, "b": 177.3, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 34, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 423.3, "r_y0": 177.3, "r_x1": 428.9, "r_y1": 177.3, "r_x2": 428.9, "r_y2": 167.9, "r_x3": 423.3, "r_y3": 167.9, "coord_origin": "TOPLEFT" }, "text": "L", "orig": "L", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 67, "label": "text", "bbox": { "l": 387.1, "t": 180.8, "r": 393.8, "b": 190.1, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 35, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 387.1, "r_y0": 190.1, "r_x1": 393.8, "r_y1": 190.1, "r_x2": 393.8, "r_y2": 180.8, "r_x3": 387.1, "r_y3": 180.8, "coord_origin": "TOPLEFT" }, "text": "X", "orig": "X", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 68, "label": "text", "bbox": { "l": 282.3, "t": 244.5, "r": 289.4, "b": 253.8, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 36, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 282.3, "r_y0": 253.8, "r_x1": 289.4, "r_y1": 253.8, "r_x2": 289.4, "r_y2": 244.5, "r_x3": 282.3, "r_y3": 244.5, "coord_origin": "TOPLEFT" }, "text": "C", "orig": "C", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 69, "label": "text", "bbox": { "l": 282.1, "t": 256.9, "r": 289.3, "b": 266.2, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 37, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 282.1, "r_y0": 266.2, "r_x1": 289.3, "r_y1": 266.2, "r_x2": 289.3, "r_y2": 256.9, "r_x3": 282.1, "r_y3": 256.9, "coord_origin": "TOPLEFT" }, "text": "U", "orig": "U", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 70, "label": "text", "bbox": { "l": 282.4, "t": 269.1, "r": 289.6, "b": 278.5, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 38, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 282.4, "r_y0": 278.5, "r_x1": 289.6, "r_y1": 278.5, "r_x2": 289.6, "r_y2": 269.1, "r_x3": 282.4, "r_y3": 269.1, "coord_origin": "TOPLEFT" }, "text": "U", "orig": "U", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 71, "label": "text", "bbox": { "l": 295.5, "t": 244.5, "r": 301.1, "b": 253.8, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 39, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 295.5, "r_y0": 253.8, "r_x1": 301.1, "r_y1": 253.8, "r_x2": 301.1, "r_y2": 244.5, "r_x3": 295.5, "r_y3": 244.5, "coord_origin": "TOPLEFT" }, "text": "L", "orig": "L", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 72, "label": "text", "bbox": { "l": 307.5, "t": 244.6, "r": 313.0, "b": 253.9, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 40, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 307.5, "r_y0": 253.9, "r_x1": 313.0, "r_y1": 253.9, "r_x2": 313.0, "r_y2": 244.6, "r_x3": 307.5, "r_y3": 244.6, "coord_origin": "TOPLEFT" }, "text": "L", "orig": "L", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 73, "label": "text", "bbox": { "l": 318.8, "t": 244.4, "r": 324.3, "b": 253.8, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 41, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 318.8, "r_y0": 253.8, "r_x1": 324.3, "r_y1": 253.8, "r_x2": 324.3, "r_y2": 244.4, "r_x3": 318.8, "r_y3": 244.4, "coord_origin": "TOPLEFT" }, "text": "L", "orig": "L", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 74, "label": "text", "bbox": { "l": 294.9, "t": 256.7, "r": 301.0, "b": 266.0, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 42, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 294.9, "r_y0": 266.0, "r_x1": 301.0, "r_y1": 266.0, "r_x2": 301.0, "r_y2": 256.7, "r_x3": 294.9, "r_y3": 256.7, "coord_origin": "TOPLEFT" }, "text": "X", "orig": "X", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 75, "label": "text", "bbox": { "l": 307.2, "t": 256.7, "r": 325.6, "b": 266.0, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 43, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 307.2, "r_y0": 266.0, "r_x1": 325.6, "r_y1": 266.0, "r_x2": 325.6, "r_y2": 256.7, "r_x3": 307.2, "r_y3": 256.7, "coord_origin": "TOPLEFT" }, "text": "X X", "orig": "X X", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 76, "label": "text", "bbox": { "l": 294.8, "t": 269.3, "r": 300.9, "b": 278.6, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 44, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 294.8, "r_y0": 278.6, "r_x1": 300.9, "r_y1": 278.6, "r_x2": 300.9, "r_y2": 269.3, "r_x3": 294.8, "r_y3": 269.3, "coord_origin": "TOPLEFT" }, "text": "X", "orig": "X", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 77, "label": "text", "bbox": { "l": 307.1, "t": 269.3, "r": 325.5, "b": 278.6, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 45, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 307.1, "r_y0": 278.6, "r_x1": 325.5, "r_y1": 278.6, "r_x2": 325.5, "r_y2": 269.3, "r_x3": 307.1, "r_y3": 269.3, "coord_origin": "TOPLEFT" }, "text": "X X", "orig": "X X", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 78, "label": "text", "bbox": { "l": 195.9, "t": 268.7, "r": 203.1, "b": 278.1, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 46, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 195.9, "r_y0": 278.1, "r_x1": 203.1, "r_y1": 278.1, "r_x2": 203.1, "r_y2": 268.7, "r_x3": 195.9, "r_y3": 268.7, "coord_origin": "TOPLEFT" }, "text": "C", "orig": "C", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 79, "label": "text", "bbox": { "l": 209.2, "t": 268.7, "r": 214.7, "b": 278.1, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 47, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 209.2, "r_y0": 278.1, "r_x1": 214.7, "r_y1": 278.1, "r_x2": 214.7, "r_y2": 268.7, "r_x3": 209.2, "r_y3": 268.7, "coord_origin": "TOPLEFT" }, "text": "L", "orig": "L", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 80, "label": "text", "bbox": { "l": 221.1, "t": 268.8, "r": 226.7, "b": 278.1, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 48, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 221.1, "r_y0": 278.1, "r_x1": 226.7, "r_y1": 278.1, "r_x2": 226.7, "r_y2": 268.8, "r_x3": 221.1, "r_y3": 268.8, "coord_origin": "TOPLEFT" }, "text": "L", "orig": "L", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 81, "label": "text", "bbox": { "l": 232.4, "t": 268.7, "r": 238.0, "b": 278.0, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 49, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 232.4, "r_y0": 278.0, "r_x1": 238.0, "r_y1": 278.0, "r_x2": 238.0, "r_y2": 268.7, "r_x3": 232.4, "r_y3": 268.7, "coord_origin": "TOPLEFT" }, "text": "L", "orig": "L", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 82, "label": "text", "bbox": { "l": 196.2, "t": 244.5, "r": 203.4, "b": 253.9, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 50, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 196.2, "r_y0": 253.9, "r_x1": 203.4, "r_y1": 253.9, "r_x2": 203.4, "r_y2": 244.5, "r_x3": 196.2, "r_y3": 244.5, "coord_origin": "TOPLEFT" }, "text": "C", "orig": "C", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 83, "label": "text", "bbox": { "l": 250.3, "t": 244.1, "r": 257.5, "b": 253.4, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 51, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 250.3, "r_y0": 253.4, "r_x1": 257.5, "r_y1": 253.4, "r_x2": 257.5, "r_y2": 244.1, "r_x3": 250.3, "r_y3": 244.1, "coord_origin": "TOPLEFT" }, "text": "C", "orig": "C", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 84, "label": "text", "bbox": { "l": 250.2, "t": 256.4, "r": 257.3, "b": 265.8, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 52, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 250.2, "r_y0": 265.8, "r_x1": 257.3, "r_y1": 265.8, "r_x2": 257.3, "r_y2": 256.4, "r_x3": 250.2, "r_y3": 256.4, "coord_origin": "TOPLEFT" }, "text": "U", "orig": "U", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 85, "label": "text", "bbox": { "l": 250.5, "t": 268.7, "r": 257.6, "b": 278.0, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 53, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 250.5, "r_y0": 278.0, "r_x1": 257.6, "r_y1": 278.0, "r_x2": 257.6, "r_y2": 268.7, "r_x3": 250.5, "r_y3": 268.7, "coord_origin": "TOPLEFT" }, "text": "U", "orig": "U", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 86, "label": "text", "bbox": { "l": 334.5, "t": 243.0, "r": 337.2, "b": 249.2, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 54, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 334.5, "r_y0": 249.2, "r_x1": 337.2, "r_y1": 249.2, "r_x2": 337.2, "r_y2": 243.0, "r_x3": 334.5, "r_y3": 243.0, "coord_origin": "TOPLEFT" }, "text": "1", "orig": "1", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 87, "label": "text", "bbox": { "l": 339.9, "t": 243.0, "r": 391.5, "b": 249.2, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 55, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 339.9, "r_y0": 249.2, "r_x1": 391.5, "r_y1": 249.2, "r_x2": 391.5, "r_y2": 243.0, "r_x3": 339.9, "r_y3": 243.0, "coord_origin": "TOPLEFT" }, "text": "- simple cells: \"C\"", "orig": "- simple cells: \"C\"", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 88, "label": "text", "bbox": { "l": 334.5, "t": 252.9, "r": 337.3, "b": 259.1, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 56, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 334.5, "r_y0": 259.1, "r_x1": 337.3, "r_y1": 259.1, "r_x2": 337.3, "r_y2": 252.9, "r_x3": 334.5, "r_y3": 252.9, "coord_origin": "TOPLEFT" }, "text": "2", "orig": "2", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 89, "label": "text", "bbox": { "l": 340.2, "t": 252.9, "r": 422.0, "b": 259.1, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 57, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 340.2, "r_y0": 259.1, "r_x1": 422.0, "r_y1": 259.1, "r_x2": 422.0, "r_y2": 252.9, "r_x3": 340.2, "r_y3": 252.9, "coord_origin": "TOPLEFT" }, "text": "- horizontal merges: \"C\", \"L\"", "orig": "- horizontal merges: \"C\", \"L\"", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 90, "label": "text", "bbox": { "l": 334.5, "t": 262.9, "r": 337.3, "b": 269.1, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 58, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 334.5, "r_y0": 269.1, "r_x1": 337.3, "r_y1": 269.1, "r_x2": 337.3, "r_y2": 262.9, "r_x3": 334.5, "r_y3": 262.9, "coord_origin": "TOPLEFT" }, "text": "3", "orig": "3", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 91, "label": "text", "bbox": { "l": 340.1, "t": 262.9, "r": 415.3, "b": 269.1, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 59, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 340.1, "r_y0": 269.1, "r_x1": 415.3, "r_y1": 269.1, "r_x2": 415.3, "r_y2": 262.9, "r_x3": 340.1, "r_y3": 262.9, "coord_origin": "TOPLEFT" }, "text": "- vertical merges: \"C\", \"U\"", "orig": "- vertical merges: \"C\", \"U\"", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 18, "label": "list_item", "bbox": { "l": 334.5, "t": 272.8, "r": 426.6, "b": 279.0, "coord_origin": "TOPLEFT" }, "confidence": 0.53, "cells": [ { "index": 60, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 334.5, "r_y0": 279.0, "r_x1": 337.3, "r_y1": 279.0, "r_x2": 337.3, "r_y2": 272.8, "r_x3": 334.5, "r_y3": 272.8, "coord_origin": "TOPLEFT" }, "text": "4", "orig": "4", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 61, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 340.1, "r_y0": 279.0, "r_x1": 426.6, "r_y1": 279.0, "r_x2": 426.6, "r_y2": 272.8, "r_x3": 340.1, "r_y3": 272.8, "coord_origin": "TOPLEFT" }, "text": "- 2d merges: \"C\", \"L\", \"U\", \"X\"", "orig": "- 2d merges: \"C\", \"L\", \"U\", \"X\"", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 92, "label": "text", "bbox": { "l": 185.7, "t": 244.0, "r": 189.4, "b": 250.3, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 62, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 185.7, "r_y0": 250.3, "r_x1": 189.4, "r_y1": 250.3, "r_x2": 189.4, "r_y2": 244.0, "r_x3": 185.7, "r_y3": 244.0, "coord_origin": "TOPLEFT" }, "text": "1", "orig": "1", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 93, "label": "text", "bbox": { "l": 186.0, "t": 268.3, "r": 189.7, "b": 274.6, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 63, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 186.0, "r_y0": 274.6, "r_x1": 189.7, "r_y1": 274.6, "r_x2": 189.7, "r_y2": 268.3, "r_x3": 186.0, "r_y3": 268.3, "coord_origin": "TOPLEFT" }, "text": "2", "orig": "2", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 94, "label": "text", "bbox": { "l": 239.3, "t": 243.6, "r": 243.0, "b": 249.8, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 64, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 239.3, "r_y0": 249.8, "r_x1": 243.0, "r_y1": 249.8, "r_x2": 243.0, "r_y2": 243.6, "r_x3": 239.3, "r_y3": 243.6, "coord_origin": "TOPLEFT" }, "text": "3", "orig": "3", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 95, "label": "text", "bbox": { "l": 271.3, "t": 243.5, "r": 275.0, "b": 249.7, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 65, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 271.3, "r_y0": 249.7, "r_x1": 275.0, "r_y1": 249.7, "r_x2": 275.0, "r_y2": 243.5, "r_x3": 271.3, "r_y3": 243.5, "coord_origin": "TOPLEFT" }, "text": "4", "orig": "4", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 96, "label": "text", "bbox": { "l": 229.8, "t": 166.5, "r": 233.5, "b": 172.7, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 66, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 229.8, "r_y0": 172.7, "r_x1": 233.5, "r_y1": 172.7, "r_x2": 233.5, "r_y2": 166.5, "r_x3": 229.8, "r_y3": 166.5, "coord_origin": "TOPLEFT" }, "text": "2", "orig": "2", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 97, "label": "text", "bbox": { "l": 257.2, "t": 190.0, "r": 260.9, "b": 196.2, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 67, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 257.2, "r_y0": 196.2, "r_x1": 260.9, "r_y1": 196.2, "r_x2": 260.9, "r_y2": 190.0, "r_x3": 257.2, "r_y3": 190.0, "coord_origin": "TOPLEFT" }, "text": "1", "orig": "1", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 98, "label": "text", "bbox": { "l": 186.9, "t": 178.0, "r": 190.6, "b": 184.2, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 68, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 186.9, "r_y0": 184.2, "r_x1": 190.6, "r_y1": 184.2, "r_x2": 190.6, "r_y2": 178.0, "r_x3": 186.9, "r_y3": 178.0, "coord_origin": "TOPLEFT" }, "text": "3", "orig": "3", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 99, "label": "text", "bbox": { "l": 196.5, "t": 169.0, "r": 200.2, "b": 175.2, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 69, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 196.5, "r_y0": 175.2, "r_x1": 200.2, "r_y1": 175.2, "r_x2": 200.2, "r_y2": 169.0, "r_x3": 196.5, "r_y3": 169.0, "coord_origin": "TOPLEFT" }, "text": "4", "orig": "4", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 100, "label": "text", "bbox": { "l": 169.7, "t": 167.9, "r": 175.7, "b": 175.7, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 70, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 169.7, "r_y0": 175.7, "r_x1": 175.7, "r_y1": 175.7, "r_x2": 175.7, "r_y2": 167.9, "r_x3": 169.7, "r_y3": 167.9, "coord_origin": "TOPLEFT" }, "text": "A", "orig": "A", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 101, "label": "text", "bbox": { "l": 169.7, "t": 206.8, "r": 175.7, "b": 214.6, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 71, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 169.7, "r_y0": 214.6, "r_x1": 175.7, "r_y1": 214.6, "r_x2": 175.7, "r_y2": 206.8, "r_x3": 169.7, "r_y3": 206.8, "coord_origin": "TOPLEFT" }, "text": "B", "orig": "B", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 102, "label": "text", "bbox": { "l": 274.3, "t": 168.3, "r": 280.3, "b": 176.0, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 72, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 274.3, "r_y0": 176.0, "r_x1": 280.3, "r_y1": 176.0, "r_x2": 280.3, "r_y2": 168.3, "r_x3": 274.3, "r_y3": 168.3, "coord_origin": "TOPLEFT" }, "text": "C", "orig": "C", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 103, "label": "text", "bbox": { "l": 359.6, "t": 168.3, "r": 365.5, "b": 176.0, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 73, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 359.6, "r_y0": 176.0, "r_x1": 365.5, "r_y1": 176.0, "r_x2": 365.5, "r_y2": 168.3, "r_x3": 359.6, "r_y3": 168.3, "coord_origin": "TOPLEFT" }, "text": "D", "orig": "D", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 104, "label": "text", "bbox": { "l": 169.7, "t": 243.2, "r": 175.3, "b": 251.0, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 74, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 169.7, "r_y0": 251.0, "r_x1": 175.3, "r_y1": 251.0, "r_x2": 175.3, "r_y2": 243.2, "r_x3": 169.7, "r_y3": 243.2, "coord_origin": "TOPLEFT" }, "text": "E", "orig": "E", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] } ] }, { "id": 9, "label": "section_header", "bbox": { "l": 134.8, "t": 305.3, "r": 246.7, "b": 314.1, "coord_origin": "TOPLEFT" }, "confidence": 0.92, "cells": [ { "index": 75, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 134.8, "r_y0": 314.1, "r_x1": 149.4, "r_y1": 314.1, "r_x2": 149.4, "r_y2": 305.3, "r_x3": 134.8, "r_y3": 305.3, "coord_origin": "TOPLEFT" }, "text": "4.2", "orig": "4.2", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 76, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 160.9, "r_y0": 314.1, "r_x1": 246.7, "r_y1": 314.1, "r_x2": 246.7, "r_y2": 305.3, "r_x3": 160.9, "r_y3": 305.3, "coord_origin": "TOPLEFT" }, "text": "Language Syntax", "orig": "Language Syntax", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 10, "label": "text", "bbox": { "l": 134.8, "t": 325.2, "r": 363.8, "b": 334.0, "coord_origin": "TOPLEFT" }, "confidence": 0.92, "cells": [ { "index": 77, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 134.8, "r_y0": 334.0, "r_x1": 363.8, "r_y1": 334.0, "r_x2": 363.8, "r_y2": 325.2, "r_x3": 134.8, "r_y3": 325.2, "coord_origin": "TOPLEFT" }, "text": "The OTSL representation follows these syntax rules:", "orig": "The OTSL representation follows these syntax rules:", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 3, "label": "list_item", "bbox": { "l": 139.0, "t": 347.2, "r": 480.6, "b": 367.9, "coord_origin": "TOPLEFT" }, "confidence": 0.96, "cells": [ { "index": 78, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 139.0, "r_y0": 356.0, "r_x1": 146.7, "r_y1": 356.0, "r_x2": 146.7, "r_y2": 347.2, "r_x3": 139.0, "r_y3": 347.2, "coord_origin": "TOPLEFT" }, "text": "1.", "orig": "1.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 79, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 151.7, "r_y0": 356.0, "r_x1": 257.4, "r_y1": 356.0, "r_x2": 257.4, "r_y2": 347.2, "r_x3": 151.7, "r_y3": 347.2, "coord_origin": "TOPLEFT" }, "text": "Left-looking cell rule", "orig": "Left-looking cell rule", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 80, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 257.4, "r_y0": 356.0, "r_x1": 480.6, "r_y1": 356.0, "r_x2": 480.6, "r_y2": 347.2, "r_x3": 257.4, "r_y3": 347.2, "coord_origin": "TOPLEFT" }, "text": ": The left neighbour of an \"L\" cell must be either", "orig": ": The left neighbour of an \"L\" cell must be either", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 81, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 151.7, "r_y0": 367.9, "r_x1": 283.6, "r_y1": 367.9, "r_x2": 283.6, "r_y2": 359.1, "r_x3": 151.7, "r_y3": 359.1, "coord_origin": "TOPLEFT" }, "text": "another \"L\" cell or a \"C\" cell.", "orig": "another \"L\" cell or a \"C\" cell.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 4, "label": "list_item", "bbox": { "l": 139.0, "t": 371.1, "r": 480.6, "b": 391.8, "coord_origin": "TOPLEFT" }, "confidence": 0.96, "cells": [ { "index": 82, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 139.0, "r_y0": 379.9, "r_x1": 146.7, "r_y1": 379.9, "r_x2": 146.7, "r_y2": 371.1, "r_x3": 139.0, "r_y3": 371.1, "coord_origin": "TOPLEFT" }, "text": "2.", "orig": "2.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 83, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 151.7, "r_y0": 379.9, "r_x1": 252.1, "r_y1": 379.9, "r_x2": 252.1, "r_y2": 371.1, "r_x3": 151.7, "r_y3": 371.1, "coord_origin": "TOPLEFT" }, "text": "Up-looking cell rule", "orig": "Up-looking cell rule", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 84, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 252.1, "r_y0": 379.9, "r_x1": 480.6, "r_y1": 379.9, "r_x2": 480.6, "r_y2": 371.1, "r_x3": 252.1, "r_y3": 371.1, "coord_origin": "TOPLEFT" }, "text": ": The upper neighbour of a \"U\" cell must be either", "orig": ": The upper neighbour of a \"U\" cell must be either", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 85, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 151.7, "r_y0": 391.8, "r_x1": 284.8, "r_y1": 391.8, "r_x2": 284.8, "r_y2": 383.0, "r_x3": 151.7, "r_y3": 383.0, "coord_origin": "TOPLEFT" }, "text": "another \"U\" cell or a \"C\" cell.", "orig": "another \"U\" cell or a \"C\" cell.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 14, "label": "section_header", "bbox": { "l": 139.0, "t": 395.0, "r": 226.1, "b": 403.8, "coord_origin": "TOPLEFT" }, "confidence": 0.65, "cells": [ { "index": 86, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 139.0, "r_y0": 403.8, "r_x1": 146.7, "r_y1": 403.8, "r_x2": 146.7, "r_y2": 395.0, "r_x3": 139.0, "r_y3": 395.0, "coord_origin": "TOPLEFT" }, "text": "3.", "orig": "3.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 87, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 151.7, "r_y0": 403.8, "r_x1": 223.3, "r_y1": 403.8, "r_x2": 223.3, "r_y2": 395.0, "r_x3": 151.7, "r_y3": 395.0, "coord_origin": "TOPLEFT" }, "text": "Cross cell rule", "orig": "Cross cell rule", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 88, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 223.3, "r_y0": 403.8, "r_x1": 226.1, "r_y1": 403.8, "r_x2": 226.1, "r_y2": 395.0, "r_x3": 223.3, "r_y3": 395.0, "coord_origin": "TOPLEFT" }, "text": ":", "orig": ":", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 13, "label": "list_item", "bbox": { "l": 151.7, "t": 407.0, "r": 480.6, "b": 439.7, "coord_origin": "TOPLEFT" }, "confidence": 0.72, "cells": [ { "index": 89, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 151.7, "r_y0": 415.8, "r_x1": 480.6, "r_y1": 415.8, "r_x2": 480.6, "r_y2": 407.0, "r_x3": 151.7, "r_y3": 407.0, "coord_origin": "TOPLEFT" }, "text": "The left neighbour of an \"X\" cell must be either another \"X\" cell or a \"U\"", "orig": "The left neighbour of an \"X\" cell must be either another \"X\" cell or a \"U\"", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 90, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 151.7, "r_y0": 427.7, "r_x1": 480.6, "r_y1": 427.7, "r_x2": 480.6, "r_y2": 418.9, "r_x3": 151.7, "r_y3": 418.9, "coord_origin": "TOPLEFT" }, "text": "cell, and the upper neighbour of an \"X\" cell must be either another \"X\" cell", "orig": "cell, and the upper neighbour of an \"X\" cell must be either another \"X\" cell", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 91, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 151.7, "r_y0": 439.7, "r_x1": 214.4, "r_y1": 439.7, "r_x2": 214.4, "r_y2": 430.9, "r_x3": 151.7, "r_y3": 430.9, "coord_origin": "TOPLEFT" }, "text": "or an \"L\" cell.", "orig": "or an \"L\" cell.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 8, "label": "list_item", "bbox": { "l": 139.0, "t": 442.8, "r": 474.6, "b": 451.6, "coord_origin": "TOPLEFT" }, "confidence": 0.93, "cells": [ { "index": 92, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 139.0, "r_y0": 451.6, "r_x1": 146.7, "r_y1": 451.6, "r_x2": 146.7, "r_y2": 442.8, "r_x3": 139.0, "r_y3": 442.8, "coord_origin": "TOPLEFT" }, "text": "4.", "orig": "4.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 93, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 151.7, "r_y0": 451.6, "r_x1": 221.3, "r_y1": 451.6, "r_x2": 221.3, "r_y2": 442.8, "r_x3": 151.7, "r_y3": 442.8, "coord_origin": "TOPLEFT" }, "text": "First row rule", "orig": "First row rule", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 94, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 221.3, "r_y0": 451.6, "r_x1": 474.6, "r_y1": 451.6, "r_x2": 474.6, "r_y2": 442.8, "r_x3": 221.3, "r_y3": 442.8, "coord_origin": "TOPLEFT" }, "text": ": Only \"L\" cells and \"C\" cells are allowed in the first row.", "orig": ": Only \"L\" cells and \"C\" cells are allowed in the first row.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 5, "label": "list_item", "bbox": { "l": 139.0, "t": 454.8, "r": 480.6, "b": 475.5, "coord_origin": "TOPLEFT" }, "confidence": 0.94, "cells": [ { "index": 95, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 139.0, "r_y0": 463.6, "r_x1": 146.7, "r_y1": 463.6, "r_x2": 146.7, "r_y2": 454.8, "r_x3": 139.0, "r_y3": 454.8, "coord_origin": "TOPLEFT" }, "text": "5.", "orig": "5.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 96, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 151.7, "r_y0": 463.6, "r_x1": 240.7, "r_y1": 463.6, "r_x2": 240.7, "r_y2": 454.8, "r_x3": 151.7, "r_y3": 454.8, "coord_origin": "TOPLEFT" }, "text": "First column rule", "orig": "First column rule", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 97, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 240.7, "r_y0": 463.6, "r_x1": 480.6, "r_y1": 463.6, "r_x2": 480.6, "r_y2": 454.8, "r_x3": 240.7, "r_y3": 454.8, "coord_origin": "TOPLEFT" }, "text": ": Only \"U\" cells and \"C\" cells are allowed in the first", "orig": ": Only \"U\" cells and \"C\" cells are allowed in the first", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 98, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 151.7, "r_y0": 475.5, "r_x1": 186.0, "r_y1": 475.5, "r_x2": 186.0, "r_y2": 466.7, "r_x3": 151.7, "r_y3": 466.7, "coord_origin": "TOPLEFT" }, "text": "column.", "orig": "column.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 1, "label": "list_item", "bbox": { "l": 139.0, "t": 478.7, "r": 480.6, "b": 499.5, "coord_origin": "TOPLEFT" }, "confidence": 0.96, "cells": [ { "index": 99, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 139.0, "r_y0": 487.5, "r_x1": 146.7, "r_y1": 487.5, "r_x2": 146.7, "r_y2": 478.7, "r_x3": 139.0, "r_y3": 478.7, "coord_origin": "TOPLEFT" }, "text": "6.", "orig": "6.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 100, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 151.7, "r_y0": 487.5, "r_x1": 235.2, "r_y1": 487.5, "r_x2": 235.2, "r_y2": 478.7, "r_x3": 151.7, "r_y3": 478.7, "coord_origin": "TOPLEFT" }, "text": "Rectangular rule", "orig": "Rectangular rule", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 101, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 235.2, "r_y0": 487.5, "r_x1": 480.6, "r_y1": 487.5, "r_x2": 480.6, "r_y2": 478.7, "r_x3": 235.2, "r_y3": 478.7, "coord_origin": "TOPLEFT" }, "text": ": The table representation is always rectangular - all rows", "orig": ": The table representation is always rectangular - all rows", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 102, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 151.7, "r_y0": 499.5, "r_x1": 448.0, "r_y1": 499.5, "r_x2": 448.0, "r_y2": 490.7, "r_x3": 151.7, "r_y3": 490.7, "coord_origin": "TOPLEFT" }, "text": "must have an equal number of tokens, terminated with \"NL\" token.", "orig": "must have an equal number of tokens, terminated with \"NL\" token.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 0, "label": "text", "bbox": { "l": 134.8, "t": 512.6, "r": 480.6, "b": 640.9, "coord_origin": "TOPLEFT" }, "confidence": 0.98, "cells": [ { "index": 103, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 149.7, "r_y0": 521.4, "r_x1": 480.6, "r_y1": 521.4, "r_x2": 480.6, "r_y2": 512.6, "r_x3": 149.7, "r_y3": 512.6, "coord_origin": "TOPLEFT" }, "text": "The application of these rules gives OTSL a set of unique properties. First", "orig": "The application of these rules gives OTSL a set of unique properties. First", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 104, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 134.8, "r_y0": 533.3, "r_x1": 480.6, "r_y1": 533.3, "r_x2": 480.6, "r_y2": 524.5, "r_x3": 134.8, "r_y3": 524.5, "coord_origin": "TOPLEFT" }, "text": "of all, the OTSL enforces a strictly rectangular structure representation, where", "orig": "of all, the OTSL enforces a strictly rectangular structure representation, where", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 105, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 134.8, "r_y0": 545.3, "r_x1": 480.6, "r_y1": 545.3, "r_x2": 480.6, "r_y2": 536.5, "r_x3": 134.8, "r_y3": 536.5, "coord_origin": "TOPLEFT" }, "text": "every new-line token starts a new row. As a consequence, all rows and all columns", "orig": "every new-line token starts a new row. As a consequence, all rows and all columns", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 106, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 134.8, "r_y0": 557.3, "r_x1": 480.6, "r_y1": 557.3, "r_x2": 480.6, "r_y2": 548.5, "r_x3": 134.8, "r_y3": 548.5, "coord_origin": "TOPLEFT" }, "text": "have exactly the same number of tokens, irrespective of cell spans. Secondly, the", "orig": "have exactly the same number of tokens, irrespective of cell spans. Secondly, the", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 107, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 134.8, "r_y0": 569.2, "r_x1": 480.6, "r_y1": 569.2, "r_x2": 480.6, "r_y2": 560.4, "r_x3": 134.8, "r_y3": 560.4, "coord_origin": "TOPLEFT" }, "text": "OTSL representation is unambiguous: Every table structure is represented in one", "orig": "OTSL representation is unambiguous: Every table structure is represented in one", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 108, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 134.8, "r_y0": 581.2, "r_x1": 480.6, "r_y1": 581.2, "r_x2": 480.6, "r_y2": 572.4, "r_x3": 134.8, "r_y3": 572.4, "coord_origin": "TOPLEFT" }, "text": "way. In this representation every table cell corresponds to a \"C\"-cell token, which", "orig": "way. In this representation every table cell corresponds to a \"C\"-cell token, which", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 109, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 134.8, "r_y0": 593.1, "r_x1": 480.6, "r_y1": 593.1, "r_x2": 480.6, "r_y2": 584.3, "r_x3": 134.8, "r_y3": 584.3, "coord_origin": "TOPLEFT" }, "text": "in case of spans is always located in the top-left corner of the table cell definition.", "orig": "in case of spans is always located in the top-left corner of the table cell definition.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 110, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 134.8, "r_y0": 605.1, "r_x1": 480.6, "r_y1": 605.1, "r_x2": 480.6, "r_y2": 596.3, "r_x3": 134.8, "r_y3": 596.3, "coord_origin": "TOPLEFT" }, "text": "Third, OTSL syntax rules are only backward-looking. As a consequence, every", "orig": "Third, OTSL syntax rules are only backward-looking. As a consequence, every", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 111, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 134.8, "r_y0": 617.0, "r_x1": 480.6, "r_y1": 617.0, "r_x2": 480.6, "r_y2": 608.2, "r_x3": 134.8, "r_y3": 608.2, "coord_origin": "TOPLEFT" }, "text": "predicted token can be validated straight during sequence generation by looking", "orig": "predicted token can be validated straight during sequence generation by looking", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 112, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 134.8, "r_y0": 629.0, "r_x1": 480.6, "r_y1": 629.0, "r_x2": 480.6, "r_y2": 620.2, "r_x3": 134.8, "r_y3": 620.2, "coord_origin": "TOPLEFT" }, "text": "at the previously predicted sequence. As such, OTSL can guarantee that every", "orig": "at the previously predicted sequence. As such, OTSL can guarantee that every", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 113, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 134.8, "r_y0": 640.9, "r_x1": 311.2, "r_y1": 640.9, "r_x2": 311.2, "r_y2": 632.1, "r_x3": 134.8, "r_y3": 632.1, "coord_origin": "TOPLEFT" }, "text": "predicted sequence is syntactically valid.", "orig": "predicted sequence is syntactically valid.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 2, "label": "text", "bbox": { "l": 134.8, "t": 644.1, "r": 480.6, "b": 664.9, "coord_origin": "TOPLEFT" }, "confidence": 0.96, "cells": [ { "index": 114, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 149.7, "r_y0": 652.9, "r_x1": 480.6, "r_y1": 652.9, "r_x2": 480.6, "r_y2": 644.1, "r_x3": 149.7, "r_y3": 644.1, "coord_origin": "TOPLEFT" }, "text": "These characteristics can be easily learned by sequence generator networks,", "orig": "These characteristics can be easily learned by sequence generator networks,", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 115, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 134.8, "r_y0": 664.9, "r_x1": 480.6, "r_y1": 664.9, "r_x2": 480.6, "r_y2": 656.1, "r_x3": 134.8, "r_y3": 656.1, "coord_origin": "TOPLEFT" }, "text": "as we demonstrate further below. We find strong indications that this pattern", "orig": "as we demonstrate further below. We find strong indications that this pattern", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] } ] }, "tablestructure": { "table_map": {} }, "figures_classification": null, "equations_prediction": null, "vlm_response": null }, "assembled": { "elements": [ { "label": "page_header", "id": 7, "page_no": 6, "cluster": { "id": 7, "label": "page_header", "bbox": { "l": 194.5, "t": 93.8, "r": 447.5, "b": 101.8, "coord_origin": "TOPLEFT" }, "confidence": 0.93, "cells": [ { "index": 0, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 194.5, "r_y0": 101.8, "r_x1": 447.5, "r_y1": 101.8, "r_x2": 447.5, "r_y2": 93.8, "r_x3": 194.5, "r_y3": 93.8, "coord_origin": "TOPLEFT" }, "text": "Optimized Table Tokenization for Table Structure Recognition", "orig": "Optimized Table Tokenization for Table Structure Recognition", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, "text": "Optimized Table Tokenization for Table Structure Recognition" }, { "label": "page_header", "id": 11, "page_no": 6, "cluster": { "id": 11, "label": "page_header", "bbox": { "l": 476.0, "t": 93.8, "r": 480.6, "b": 101.8, "coord_origin": "TOPLEFT" }, "confidence": 0.87, "cells": [ { "index": 1, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 476.0, "r_y0": 101.8, "r_x1": 480.6, "r_y1": 101.8, "r_x2": 480.6, "r_y2": 93.8, "r_x3": 476.0, "r_y3": 93.8, "coord_origin": "TOPLEFT" }, "text": "7", "orig": "7", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, "text": "7" }, { "label": "caption", "id": 6, "page_no": 6, "cluster": { "id": 6, "label": "caption", "bbox": { "l": 134.8, "t": 125.8, "r": 480.6, "b": 155.8, "coord_origin": "TOPLEFT" }, "confidence": 0.93, "cells": [ { "index": 2, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 134.8, "r_y0": 133.7, "r_x1": 162.6, "r_y1": 133.7, "r_x2": 162.6, "r_y2": 125.8, "r_x3": 134.8, "r_y3": 125.8, "coord_origin": "TOPLEFT" }, "text": "Fig. 3.", "orig": "Fig. 3.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 3, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 166.3, "r_y0": 133.9, "r_x1": 480.6, "r_y1": 133.9, "r_x2": 480.6, "r_y2": 125.9, "r_x3": 166.3, "r_y3": 125.9, "coord_origin": "TOPLEFT" }, "text": "OTSL description of table structure: A - table example; B - graphical repre-", "orig": "OTSL description of table structure: A - table example; B - graphical repre-", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 4, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 134.8, "r_y0": 144.9, "r_x1": 480.6, "r_y1": 144.9, "r_x2": 480.6, "r_y2": 136.8, "r_x3": 134.8, "r_y3": 136.8, "coord_origin": "TOPLEFT" }, "text": "sentation of table structure; C - mapping structure on a grid; D - OTSL structure", "orig": "sentation of table structure; C - mapping structure on a grid; D - OTSL structure", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 5, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 134.8, "r_y0": 155.8, "r_x1": 306.1, "r_y1": 155.8, "r_x2": 306.1, "r_y2": 147.8, "r_x3": 134.8, "r_y3": 147.8, "coord_origin": "TOPLEFT" }, "text": "encoding; E - explanation on cell encoding", "orig": "encoding; E - explanation on cell encoding", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, "text": "Fig. 3. OTSL description of table structure: A - table example; B - graphical representation of table structure; C - mapping structure on a grid; D - OTSL structure encoding; E - explanation on cell encoding" }, { "label": "picture", "id": 12, "page_no": 6, "cluster": { "id": 12, "label": "picture", "bbox": { "l": 164.7, "t": 163.8, "r": 449.6, "b": 280.3, "coord_origin": "TOPLEFT" }, "confidence": 0.79, "cells": [ { "index": 6, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 374.5, "r_y0": 177.9, "r_x1": 381.7, "r_y1": 177.9, "r_x2": 381.7, "r_y2": 168.6, "r_x3": 374.5, "r_y3": 168.6, "coord_origin": "TOPLEFT" }, "text": "C", "orig": "C", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 7, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 398.7, "r_y0": 177.8, "r_x1": 405.9, "r_y1": 177.8, "r_x2": 405.9, "r_y2": 168.5, "r_x3": 398.7, "r_y3": 168.5, "coord_origin": "TOPLEFT" }, "text": "C", "orig": "C", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 8, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 373.8, "r_y0": 202.2, "r_x1": 380.9, "r_y1": 202.2, "r_x2": 380.9, "r_y2": 192.9, "r_x3": 373.8, "r_y3": 192.9, "coord_origin": "TOPLEFT" }, "text": "C", "orig": "C", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 9, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 386.7, "r_y0": 202.4, "r_x1": 393.8, "r_y1": 202.4, "r_x2": 393.8, "r_y2": 193.1, "r_x3": 386.7, "r_y3": 193.1, "coord_origin": "TOPLEFT" }, "text": "C", "orig": "C", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 10, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 386.7, "r_y0": 214.5, "r_x1": 393.9, "r_y1": 214.5, "r_x2": 393.9, "r_y2": 205.1, "r_x3": 386.7, "r_y3": 205.1, "coord_origin": "TOPLEFT" }, "text": "C", "orig": "C", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 11, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 398.7, "r_y0": 190.1, "r_x1": 405.8, "r_y1": 190.1, "r_x2": 405.8, "r_y2": 180.7, "r_x3": 398.7, "r_y3": 180.7, "coord_origin": "TOPLEFT" }, "text": "C", "orig": "C", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 12, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 410.8, "r_y0": 190.1, "r_x1": 418.0, "r_y1": 190.1, "r_x2": 418.0, "r_y2": 180.7, "r_x3": 410.8, "r_y3": 180.7, "coord_origin": "TOPLEFT" }, "text": "C", "orig": "C", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 13, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 422.9, "r_y0": 190.0, "r_x1": 430.1, "r_y1": 190.0, "r_x2": 430.1, "r_y2": 180.7, "r_x3": 422.9, "r_y3": 180.7, "coord_origin": "TOPLEFT" }, "text": "C", "orig": "C", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 14, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 398.8, "r_y0": 202.3, "r_x1": 406.0, "r_y1": 202.3, "r_x2": 406.0, "r_y2": 193.0, "r_x3": 398.8, "r_y3": 193.0, "coord_origin": "TOPLEFT" }, "text": "C", "orig": "C", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 15, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 410.9, "r_y0": 202.3, "r_x1": 418.1, "r_y1": 202.3, "r_x2": 418.1, "r_y2": 193.0, "r_x3": 410.9, "r_y3": 193.0, "coord_origin": "TOPLEFT" }, "text": "C", "orig": "C", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 16, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 423.0, "r_y0": 202.2, "r_x1": 430.2, "r_y1": 202.2, "r_x2": 430.2, "r_y2": 192.9, "r_x3": 423.0, "r_y3": 192.9, "coord_origin": "TOPLEFT" }, "text": "C", "orig": "C", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 17, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 398.8, "r_y0": 214.6, "r_x1": 406.0, "r_y1": 214.6, "r_x2": 406.0, "r_y2": 205.3, "r_x3": 398.8, "r_y3": 205.3, "coord_origin": "TOPLEFT" }, "text": "C", "orig": "C", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 18, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 410.9, "r_y0": 214.6, "r_x1": 418.1, "r_y1": 214.6, "r_x2": 418.1, "r_y2": 205.3, "r_x3": 410.9, "r_y3": 205.3, "coord_origin": "TOPLEFT" }, "text": "C", "orig": "C", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 19, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 423.0, "r_y0": 214.6, "r_x1": 430.2, "r_y1": 214.6, "r_x2": 430.2, "r_y2": 205.2, "r_x3": 423.0, "r_y3": 205.2, "coord_origin": "TOPLEFT" }, "text": "C", "orig": "C", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 20, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 386.5, "r_y0": 226.4, "r_x1": 393.7, "r_y1": 226.4, "r_x2": 393.7, "r_y2": 217.0, "r_x3": 386.5, "r_y3": 217.0, "coord_origin": "TOPLEFT" }, "text": "C", "orig": "C", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 21, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 398.6, "r_y0": 226.5, "r_x1": 405.8, "r_y1": 226.5, "r_x2": 405.8, "r_y2": 217.2, "r_x3": 398.6, "r_y3": 217.2, "coord_origin": "TOPLEFT" }, "text": "C", "orig": "C", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 22, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 410.7, "r_y0": 226.5, "r_x1": 417.9, "r_y1": 226.5, "r_x2": 417.9, "r_y2": 217.2, "r_x3": 410.7, "r_y3": 217.2, "coord_origin": "TOPLEFT" }, "text": "C", "orig": "C", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 23, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 422.8, "r_y0": 226.5, "r_x1": 430.0, "r_y1": 226.5, "r_x2": 430.0, "r_y2": 217.1, "r_x3": 422.8, "r_y3": 217.1, "coord_origin": "TOPLEFT" }, "text": "C", "orig": "C", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 24, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 435.2, "r_y0": 177.0, "r_x1": 447.9, "r_y1": 177.0, "r_x2": 447.9, "r_y2": 167.7, "r_x3": 435.2, "r_y3": 167.7, "coord_origin": "TOPLEFT" }, "text": "NL", "orig": "NL", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 25, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 435.4, "r_y0": 189.5, "r_x1": 448.1, "r_y1": 189.5, "r_x2": 448.1, "r_y2": 180.2, "r_x3": 435.4, "r_y3": 180.2, "coord_origin": "TOPLEFT" }, "text": "NL", "orig": "NL", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 26, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 435.5, "r_y0": 201.8, "r_x1": 448.2, "r_y1": 201.8, "r_x2": 448.2, "r_y2": 192.5, "r_x3": 435.5, "r_y3": 192.5, "coord_origin": "TOPLEFT" }, "text": "NL", "orig": "NL", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 27, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 435.4, "r_y0": 214.2, "r_x1": 448.1, "r_y1": 214.2, "r_x2": 448.1, "r_y2": 204.8, "r_x3": 435.4, "r_y3": 204.8, "coord_origin": "TOPLEFT" }, "text": "NL", "orig": "NL", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 28, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 435.6, "r_y0": 226.6, "r_x1": 448.3, "r_y1": 226.6, "r_x2": 448.3, "r_y2": 217.2, "r_x3": 435.6, "r_y3": 217.2, "coord_origin": "TOPLEFT" }, "text": "NL", "orig": "NL", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 29, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 374.1, "r_y0": 214.6, "r_x1": 381.3, "r_y1": 214.6, "r_x2": 381.3, "r_y2": 205.2, "r_x3": 374.1, "r_y3": 205.2, "coord_origin": "TOPLEFT" }, "text": "U", "orig": "U", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 30, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 374.0, "r_y0": 226.5, "r_x1": 381.2, "r_y1": 226.5, "r_x2": 381.2, "r_y2": 217.1, "r_x3": 374.0, "r_y3": 217.1, "coord_origin": "TOPLEFT" }, "text": "U", "orig": "U", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 31, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 374.3, "r_y0": 190.3, "r_x1": 381.5, "r_y1": 190.3, "r_x2": 381.5, "r_y2": 180.9, "r_x3": 374.3, "r_y3": 180.9, "coord_origin": "TOPLEFT" }, "text": "U", "orig": "U", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 32, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 387.8, "r_y0": 177.9, "r_x1": 393.3, "r_y1": 177.9, "r_x2": 393.3, "r_y2": 168.6, "r_x3": 387.8, "r_y3": 168.6, "coord_origin": "TOPLEFT" }, "text": "L", "orig": "L", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 33, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 411.9, "r_y0": 177.4, "r_x1": 417.4, "r_y1": 177.4, "r_x2": 417.4, "r_y2": 168.1, "r_x3": 411.9, "r_y3": 168.1, "coord_origin": "TOPLEFT" }, "text": "L", "orig": "L", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 34, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 423.3, "r_y0": 177.3, "r_x1": 428.9, "r_y1": 177.3, "r_x2": 428.9, "r_y2": 167.9, "r_x3": 423.3, "r_y3": 167.9, "coord_origin": "TOPLEFT" }, "text": "L", "orig": "L", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 35, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 387.1, "r_y0": 190.1, "r_x1": 393.8, "r_y1": 190.1, "r_x2": 393.8, "r_y2": 180.8, "r_x3": 387.1, "r_y3": 180.8, "coord_origin": "TOPLEFT" }, "text": "X", "orig": "X", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 36, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 282.3, "r_y0": 253.8, "r_x1": 289.4, "r_y1": 253.8, "r_x2": 289.4, "r_y2": 244.5, "r_x3": 282.3, "r_y3": 244.5, "coord_origin": "TOPLEFT" }, "text": "C", "orig": "C", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 37, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 282.1, "r_y0": 266.2, "r_x1": 289.3, "r_y1": 266.2, "r_x2": 289.3, "r_y2": 256.9, "r_x3": 282.1, "r_y3": 256.9, "coord_origin": "TOPLEFT" }, "text": "U", "orig": "U", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 38, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 282.4, "r_y0": 278.5, "r_x1": 289.6, "r_y1": 278.5, "r_x2": 289.6, "r_y2": 269.1, "r_x3": 282.4, "r_y3": 269.1, "coord_origin": "TOPLEFT" }, "text": "U", "orig": "U", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 39, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 295.5, "r_y0": 253.8, "r_x1": 301.1, "r_y1": 253.8, "r_x2": 301.1, "r_y2": 244.5, "r_x3": 295.5, "r_y3": 244.5, "coord_origin": "TOPLEFT" }, "text": "L", "orig": "L", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 40, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 307.5, "r_y0": 253.9, "r_x1": 313.0, "r_y1": 253.9, "r_x2": 313.0, "r_y2": 244.6, "r_x3": 307.5, "r_y3": 244.6, "coord_origin": "TOPLEFT" }, "text": "L", "orig": "L", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 41, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 318.8, "r_y0": 253.8, "r_x1": 324.3, "r_y1": 253.8, "r_x2": 324.3, "r_y2": 244.4, "r_x3": 318.8, "r_y3": 244.4, "coord_origin": "TOPLEFT" }, "text": "L", "orig": "L", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 42, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 294.9, "r_y0": 266.0, "r_x1": 301.0, "r_y1": 266.0, "r_x2": 301.0, "r_y2": 256.7, "r_x3": 294.9, "r_y3": 256.7, "coord_origin": "TOPLEFT" }, "text": "X", "orig": "X", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 43, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 307.2, "r_y0": 266.0, "r_x1": 325.6, "r_y1": 266.0, "r_x2": 325.6, "r_y2": 256.7, "r_x3": 307.2, "r_y3": 256.7, "coord_origin": "TOPLEFT" }, "text": "X X", "orig": "X X", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 44, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 294.8, "r_y0": 278.6, "r_x1": 300.9, "r_y1": 278.6, "r_x2": 300.9, "r_y2": 269.3, "r_x3": 294.8, "r_y3": 269.3, "coord_origin": "TOPLEFT" }, "text": "X", "orig": "X", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 45, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 307.1, "r_y0": 278.6, "r_x1": 325.5, "r_y1": 278.6, "r_x2": 325.5, "r_y2": 269.3, "r_x3": 307.1, "r_y3": 269.3, "coord_origin": "TOPLEFT" }, "text": "X X", "orig": "X X", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 46, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 195.9, "r_y0": 278.1, "r_x1": 203.1, "r_y1": 278.1, "r_x2": 203.1, "r_y2": 268.7, "r_x3": 195.9, "r_y3": 268.7, "coord_origin": "TOPLEFT" }, "text": "C", "orig": "C", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 47, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 209.2, "r_y0": 278.1, "r_x1": 214.7, "r_y1": 278.1, "r_x2": 214.7, "r_y2": 268.7, "r_x3": 209.2, "r_y3": 268.7, "coord_origin": "TOPLEFT" }, "text": "L", "orig": "L", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 48, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 221.1, "r_y0": 278.1, "r_x1": 226.7, "r_y1": 278.1, "r_x2": 226.7, "r_y2": 268.8, "r_x3": 221.1, "r_y3": 268.8, "coord_origin": "TOPLEFT" }, "text": "L", "orig": "L", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 49, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 232.4, "r_y0": 278.0, "r_x1": 238.0, "r_y1": 278.0, "r_x2": 238.0, "r_y2": 268.7, "r_x3": 232.4, "r_y3": 268.7, "coord_origin": "TOPLEFT" }, "text": "L", "orig": "L", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 50, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 196.2, "r_y0": 253.9, "r_x1": 203.4, "r_y1": 253.9, "r_x2": 203.4, "r_y2": 244.5, "r_x3": 196.2, "r_y3": 244.5, "coord_origin": "TOPLEFT" }, "text": "C", "orig": "C", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 51, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 250.3, "r_y0": 253.4, "r_x1": 257.5, "r_y1": 253.4, "r_x2": 257.5, "r_y2": 244.1, "r_x3": 250.3, "r_y3": 244.1, "coord_origin": "TOPLEFT" }, "text": "C", "orig": "C", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 52, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 250.2, "r_y0": 265.8, "r_x1": 257.3, "r_y1": 265.8, "r_x2": 257.3, "r_y2": 256.4, "r_x3": 250.2, "r_y3": 256.4, "coord_origin": "TOPLEFT" }, "text": "U", "orig": "U", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 53, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 250.5, "r_y0": 278.0, "r_x1": 257.6, "r_y1": 278.0, "r_x2": 257.6, "r_y2": 268.7, "r_x3": 250.5, "r_y3": 268.7, "coord_origin": "TOPLEFT" }, "text": "U", "orig": "U", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 54, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 334.5, "r_y0": 249.2, "r_x1": 337.2, "r_y1": 249.2, "r_x2": 337.2, "r_y2": 243.0, "r_x3": 334.5, "r_y3": 243.0, "coord_origin": "TOPLEFT" }, "text": "1", "orig": "1", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 55, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 339.9, "r_y0": 249.2, "r_x1": 391.5, "r_y1": 249.2, "r_x2": 391.5, "r_y2": 243.0, "r_x3": 339.9, "r_y3": 243.0, "coord_origin": "TOPLEFT" }, "text": "- simple cells: \"C\"", "orig": "- simple cells: \"C\"", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 56, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 334.5, "r_y0": 259.1, "r_x1": 337.3, "r_y1": 259.1, "r_x2": 337.3, "r_y2": 252.9, "r_x3": 334.5, "r_y3": 252.9, "coord_origin": "TOPLEFT" }, "text": "2", "orig": "2", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 57, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 340.2, "r_y0": 259.1, "r_x1": 422.0, "r_y1": 259.1, "r_x2": 422.0, "r_y2": 252.9, "r_x3": 340.2, "r_y3": 252.9, "coord_origin": "TOPLEFT" }, "text": "- horizontal merges: \"C\", \"L\"", "orig": "- horizontal merges: \"C\", \"L\"", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 58, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 334.5, "r_y0": 269.1, "r_x1": 337.3, "r_y1": 269.1, "r_x2": 337.3, "r_y2": 262.9, "r_x3": 334.5, "r_y3": 262.9, "coord_origin": "TOPLEFT" }, "text": "3", "orig": "3", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 59, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 340.1, "r_y0": 269.1, "r_x1": 415.3, "r_y1": 269.1, "r_x2": 415.3, "r_y2": 262.9, "r_x3": 340.1, "r_y3": 262.9, "coord_origin": "TOPLEFT" }, "text": "- vertical merges: \"C\", \"U\"", "orig": "- vertical merges: \"C\", \"U\"", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 60, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 334.5, "r_y0": 279.0, "r_x1": 337.3, "r_y1": 279.0, "r_x2": 337.3, "r_y2": 272.8, "r_x3": 334.5, "r_y3": 272.8, "coord_origin": "TOPLEFT" }, "text": "4", "orig": "4", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 61, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 340.1, "r_y0": 279.0, "r_x1": 426.6, "r_y1": 279.0, "r_x2": 426.6, "r_y2": 272.8, "r_x3": 340.1, "r_y3": 272.8, "coord_origin": "TOPLEFT" }, "text": "- 2d merges: \"C\", \"L\", \"U\", \"X\"", "orig": "- 2d merges: \"C\", \"L\", \"U\", \"X\"", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 62, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 185.7, "r_y0": 250.3, "r_x1": 189.4, "r_y1": 250.3, "r_x2": 189.4, "r_y2": 244.0, "r_x3": 185.7, "r_y3": 244.0, "coord_origin": "TOPLEFT" }, "text": "1", "orig": "1", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 63, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 186.0, "r_y0": 274.6, "r_x1": 189.7, "r_y1": 274.6, "r_x2": 189.7, "r_y2": 268.3, "r_x3": 186.0, "r_y3": 268.3, "coord_origin": "TOPLEFT" }, "text": "2", "orig": "2", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 64, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 239.3, "r_y0": 249.8, "r_x1": 243.0, "r_y1": 249.8, "r_x2": 243.0, "r_y2": 243.6, "r_x3": 239.3, "r_y3": 243.6, "coord_origin": "TOPLEFT" }, "text": "3", "orig": "3", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 65, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 271.3, "r_y0": 249.7, "r_x1": 275.0, "r_y1": 249.7, "r_x2": 275.0, "r_y2": 243.5, "r_x3": 271.3, "r_y3": 243.5, "coord_origin": "TOPLEFT" }, "text": "4", "orig": "4", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 66, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 229.8, "r_y0": 172.7, "r_x1": 233.5, "r_y1": 172.7, "r_x2": 233.5, "r_y2": 166.5, "r_x3": 229.8, "r_y3": 166.5, "coord_origin": "TOPLEFT" }, "text": "2", "orig": "2", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 67, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 257.2, "r_y0": 196.2, "r_x1": 260.9, "r_y1": 196.2, "r_x2": 260.9, "r_y2": 190.0, "r_x3": 257.2, "r_y3": 190.0, "coord_origin": "TOPLEFT" }, "text": "1", "orig": "1", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 68, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 186.9, "r_y0": 184.2, "r_x1": 190.6, "r_y1": 184.2, "r_x2": 190.6, "r_y2": 178.0, "r_x3": 186.9, "r_y3": 178.0, "coord_origin": "TOPLEFT" }, "text": "3", "orig": "3", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 69, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 196.5, "r_y0": 175.2, "r_x1": 200.2, "r_y1": 175.2, "r_x2": 200.2, "r_y2": 169.0, "r_x3": 196.5, "r_y3": 169.0, "coord_origin": "TOPLEFT" }, "text": "4", "orig": "4", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 70, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 169.7, "r_y0": 175.7, "r_x1": 175.7, "r_y1": 175.7, "r_x2": 175.7, "r_y2": 167.9, "r_x3": 169.7, "r_y3": 167.9, "coord_origin": "TOPLEFT" }, "text": "A", "orig": "A", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 71, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 169.7, "r_y0": 214.6, "r_x1": 175.7, "r_y1": 214.6, "r_x2": 175.7, "r_y2": 206.8, "r_x3": 169.7, "r_y3": 206.8, "coord_origin": "TOPLEFT" }, "text": "B", "orig": "B", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 72, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 274.3, "r_y0": 176.0, "r_x1": 280.3, "r_y1": 176.0, "r_x2": 280.3, "r_y2": 168.3, "r_x3": 274.3, "r_y3": 168.3, "coord_origin": "TOPLEFT" }, "text": "C", "orig": "C", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 73, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 359.6, "r_y0": 176.0, "r_x1": 365.5, "r_y1": 176.0, "r_x2": 365.5, "r_y2": 168.3, "r_x3": 359.6, "r_y3": 168.3, "coord_origin": "TOPLEFT" }, "text": "D", "orig": "D", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 74, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 169.7, "r_y0": 251.0, "r_x1": 175.3, "r_y1": 251.0, "r_x2": 175.3, "r_y2": 243.2, "r_x3": 169.7, "r_y3": 243.2, "coord_origin": "TOPLEFT" }, "text": "E", "orig": "E", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [ { "id": 38, "label": "text", "bbox": { "l": 374.5, "t": 168.6, "r": 381.7, "b": 177.9, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 6, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 374.5, "r_y0": 177.9, "r_x1": 381.7, "r_y1": 177.9, "r_x2": 381.7, "r_y2": 168.6, "r_x3": 374.5, "r_y3": 168.6, "coord_origin": "TOPLEFT" }, "text": "C", "orig": "C", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 39, "label": "text", "bbox": { "l": 398.7, "t": 168.5, "r": 405.9, "b": 177.8, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 7, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 398.7, "r_y0": 177.8, "r_x1": 405.9, "r_y1": 177.8, "r_x2": 405.9, "r_y2": 168.5, "r_x3": 398.7, "r_y3": 168.5, "coord_origin": "TOPLEFT" }, "text": "C", "orig": "C", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 40, "label": "text", "bbox": { "l": 373.8, "t": 192.9, "r": 380.9, "b": 202.2, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 8, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 373.8, "r_y0": 202.2, "r_x1": 380.9, "r_y1": 202.2, "r_x2": 380.9, "r_y2": 192.9, "r_x3": 373.8, "r_y3": 192.9, "coord_origin": "TOPLEFT" }, "text": "C", "orig": "C", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 41, "label": "text", "bbox": { "l": 386.7, "t": 193.1, "r": 393.8, "b": 202.4, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 9, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 386.7, "r_y0": 202.4, "r_x1": 393.8, "r_y1": 202.4, "r_x2": 393.8, "r_y2": 193.1, "r_x3": 386.7, "r_y3": 193.1, "coord_origin": "TOPLEFT" }, "text": "C", "orig": "C", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 42, "label": "text", "bbox": { "l": 386.7, "t": 205.1, "r": 393.9, "b": 214.5, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 10, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 386.7, "r_y0": 214.5, "r_x1": 393.9, "r_y1": 214.5, "r_x2": 393.9, "r_y2": 205.1, "r_x3": 386.7, "r_y3": 205.1, "coord_origin": "TOPLEFT" }, "text": "C", "orig": "C", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 43, "label": "text", "bbox": { "l": 398.7, "t": 180.7, "r": 405.8, "b": 190.1, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 11, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 398.7, "r_y0": 190.1, "r_x1": 405.8, "r_y1": 190.1, "r_x2": 405.8, "r_y2": 180.7, "r_x3": 398.7, "r_y3": 180.7, "coord_origin": "TOPLEFT" }, "text": "C", "orig": "C", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 44, "label": "text", "bbox": { "l": 410.8, "t": 180.7, "r": 418.0, "b": 190.1, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 12, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 410.8, "r_y0": 190.1, "r_x1": 418.0, "r_y1": 190.1, "r_x2": 418.0, "r_y2": 180.7, "r_x3": 410.8, "r_y3": 180.7, "coord_origin": "TOPLEFT" }, "text": "C", "orig": "C", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 45, "label": "text", "bbox": { "l": 422.9, "t": 180.7, "r": 430.1, "b": 190.0, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 13, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 422.9, "r_y0": 190.0, "r_x1": 430.1, "r_y1": 190.0, "r_x2": 430.1, "r_y2": 180.7, "r_x3": 422.9, "r_y3": 180.7, "coord_origin": "TOPLEFT" }, "text": "C", "orig": "C", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 46, "label": "text", "bbox": { "l": 398.8, "t": 193.0, "r": 406.0, "b": 202.3, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 14, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 398.8, "r_y0": 202.3, "r_x1": 406.0, "r_y1": 202.3, "r_x2": 406.0, "r_y2": 193.0, "r_x3": 398.8, "r_y3": 193.0, "coord_origin": "TOPLEFT" }, "text": "C", "orig": "C", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 47, "label": "text", "bbox": { "l": 410.9, "t": 193.0, "r": 418.1, "b": 202.3, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 15, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 410.9, "r_y0": 202.3, "r_x1": 418.1, "r_y1": 202.3, "r_x2": 418.1, "r_y2": 193.0, "r_x3": 410.9, "r_y3": 193.0, "coord_origin": "TOPLEFT" }, "text": "C", "orig": "C", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 48, "label": "text", "bbox": { "l": 423.0, "t": 192.9, "r": 430.2, "b": 202.2, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 16, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 423.0, "r_y0": 202.2, "r_x1": 430.2, "r_y1": 202.2, "r_x2": 430.2, "r_y2": 192.9, "r_x3": 423.0, "r_y3": 192.9, "coord_origin": "TOPLEFT" }, "text": "C", "orig": "C", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 49, "label": "text", "bbox": { "l": 398.8, "t": 205.3, "r": 406.0, "b": 214.6, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 17, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 398.8, "r_y0": 214.6, "r_x1": 406.0, "r_y1": 214.6, "r_x2": 406.0, "r_y2": 205.3, "r_x3": 398.8, "r_y3": 205.3, "coord_origin": "TOPLEFT" }, "text": "C", "orig": "C", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 50, "label": "text", "bbox": { "l": 410.9, "t": 205.3, "r": 418.1, "b": 214.6, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 18, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 410.9, "r_y0": 214.6, "r_x1": 418.1, "r_y1": 214.6, "r_x2": 418.1, "r_y2": 205.3, "r_x3": 410.9, "r_y3": 205.3, "coord_origin": "TOPLEFT" }, "text": "C", "orig": "C", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 51, "label": "text", "bbox": { "l": 423.0, "t": 205.2, "r": 430.2, "b": 214.6, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 19, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 423.0, "r_y0": 214.6, "r_x1": 430.2, "r_y1": 214.6, "r_x2": 430.2, "r_y2": 205.2, "r_x3": 423.0, "r_y3": 205.2, "coord_origin": "TOPLEFT" }, "text": "C", "orig": "C", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 52, "label": "text", "bbox": { "l": 386.5, "t": 217.0, "r": 393.7, "b": 226.4, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 20, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 386.5, "r_y0": 226.4, "r_x1": 393.7, "r_y1": 226.4, "r_x2": 393.7, "r_y2": 217.0, "r_x3": 386.5, "r_y3": 217.0, "coord_origin": "TOPLEFT" }, "text": "C", "orig": "C", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 53, "label": "text", "bbox": { "l": 398.6, "t": 217.2, "r": 405.8, "b": 226.5, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 21, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 398.6, "r_y0": 226.5, "r_x1": 405.8, "r_y1": 226.5, "r_x2": 405.8, "r_y2": 217.2, "r_x3": 398.6, "r_y3": 217.2, "coord_origin": "TOPLEFT" }, "text": "C", "orig": "C", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 54, "label": "text", "bbox": { "l": 410.7, "t": 217.2, "r": 417.9, "b": 226.5, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 22, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 410.7, "r_y0": 226.5, "r_x1": 417.9, "r_y1": 226.5, "r_x2": 417.9, "r_y2": 217.2, "r_x3": 410.7, "r_y3": 217.2, "coord_origin": "TOPLEFT" }, "text": "C", "orig": "C", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 55, "label": "text", "bbox": { "l": 422.8, "t": 217.1, "r": 430.0, "b": 226.5, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 23, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 422.8, "r_y0": 226.5, "r_x1": 430.0, "r_y1": 226.5, "r_x2": 430.0, "r_y2": 217.1, "r_x3": 422.8, "r_y3": 217.1, "coord_origin": "TOPLEFT" }, "text": "C", "orig": "C", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 56, "label": "text", "bbox": { "l": 435.2, "t": 167.7, "r": 447.9, "b": 177.0, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 24, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 435.2, "r_y0": 177.0, "r_x1": 447.9, "r_y1": 177.0, "r_x2": 447.9, "r_y2": 167.7, "r_x3": 435.2, "r_y3": 167.7, "coord_origin": "TOPLEFT" }, "text": "NL", "orig": "NL", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 57, "label": "text", "bbox": { "l": 435.4, "t": 180.2, "r": 448.1, "b": 189.5, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 25, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 435.4, "r_y0": 189.5, "r_x1": 448.1, "r_y1": 189.5, "r_x2": 448.1, "r_y2": 180.2, "r_x3": 435.4, "r_y3": 180.2, "coord_origin": "TOPLEFT" }, "text": "NL", "orig": "NL", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 58, "label": "text", "bbox": { "l": 435.5, "t": 192.5, "r": 448.2, "b": 201.8, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 26, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 435.5, "r_y0": 201.8, "r_x1": 448.2, "r_y1": 201.8, "r_x2": 448.2, "r_y2": 192.5, "r_x3": 435.5, "r_y3": 192.5, "coord_origin": "TOPLEFT" }, "text": "NL", "orig": "NL", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 59, "label": "text", "bbox": { "l": 435.4, "t": 204.8, "r": 448.1, "b": 214.2, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 27, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 435.4, "r_y0": 214.2, "r_x1": 448.1, "r_y1": 214.2, "r_x2": 448.1, "r_y2": 204.8, "r_x3": 435.4, "r_y3": 204.8, "coord_origin": "TOPLEFT" }, "text": "NL", "orig": "NL", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 60, "label": "text", "bbox": { "l": 435.6, "t": 217.2, "r": 448.3, "b": 226.6, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 28, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 435.6, "r_y0": 226.6, "r_x1": 448.3, "r_y1": 226.6, "r_x2": 448.3, "r_y2": 217.2, "r_x3": 435.6, "r_y3": 217.2, "coord_origin": "TOPLEFT" }, "text": "NL", "orig": "NL", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 61, "label": "text", "bbox": { "l": 374.1, "t": 205.2, "r": 381.3, "b": 214.6, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 29, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 374.1, "r_y0": 214.6, "r_x1": 381.3, "r_y1": 214.6, "r_x2": 381.3, "r_y2": 205.2, "r_x3": 374.1, "r_y3": 205.2, "coord_origin": "TOPLEFT" }, "text": "U", "orig": "U", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 62, "label": "text", "bbox": { "l": 374.0, "t": 217.1, "r": 381.2, "b": 226.5, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 30, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 374.0, "r_y0": 226.5, "r_x1": 381.2, "r_y1": 226.5, "r_x2": 381.2, "r_y2": 217.1, "r_x3": 374.0, "r_y3": 217.1, "coord_origin": "TOPLEFT" }, "text": "U", "orig": "U", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 63, "label": "text", "bbox": { "l": 374.3, "t": 180.9, "r": 381.5, "b": 190.3, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 31, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 374.3, "r_y0": 190.3, "r_x1": 381.5, "r_y1": 190.3, "r_x2": 381.5, "r_y2": 180.9, "r_x3": 374.3, "r_y3": 180.9, "coord_origin": "TOPLEFT" }, "text": "U", "orig": "U", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 64, "label": "text", "bbox": { "l": 387.8, "t": 168.6, "r": 393.3, "b": 177.9, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 32, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 387.8, "r_y0": 177.9, "r_x1": 393.3, "r_y1": 177.9, "r_x2": 393.3, "r_y2": 168.6, "r_x3": 387.8, "r_y3": 168.6, "coord_origin": "TOPLEFT" }, "text": "L", "orig": "L", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 65, "label": "text", "bbox": { "l": 411.9, "t": 168.1, "r": 417.4, "b": 177.4, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 33, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 411.9, "r_y0": 177.4, "r_x1": 417.4, "r_y1": 177.4, "r_x2": 417.4, "r_y2": 168.1, "r_x3": 411.9, "r_y3": 168.1, "coord_origin": "TOPLEFT" }, "text": "L", "orig": "L", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 66, "label": "text", "bbox": { "l": 423.3, "t": 167.9, "r": 428.9, "b": 177.3, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 34, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 423.3, "r_y0": 177.3, "r_x1": 428.9, "r_y1": 177.3, "r_x2": 428.9, "r_y2": 167.9, "r_x3": 423.3, "r_y3": 167.9, "coord_origin": "TOPLEFT" }, "text": "L", "orig": "L", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 67, "label": "text", "bbox": { "l": 387.1, "t": 180.8, "r": 393.8, "b": 190.1, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 35, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 387.1, "r_y0": 190.1, "r_x1": 393.8, "r_y1": 190.1, "r_x2": 393.8, "r_y2": 180.8, "r_x3": 387.1, "r_y3": 180.8, "coord_origin": "TOPLEFT" }, "text": "X", "orig": "X", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 68, "label": "text", "bbox": { "l": 282.3, "t": 244.5, "r": 289.4, "b": 253.8, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 36, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 282.3, "r_y0": 253.8, "r_x1": 289.4, "r_y1": 253.8, "r_x2": 289.4, "r_y2": 244.5, "r_x3": 282.3, "r_y3": 244.5, "coord_origin": "TOPLEFT" }, "text": "C", "orig": "C", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 69, "label": "text", "bbox": { "l": 282.1, "t": 256.9, "r": 289.3, "b": 266.2, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 37, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 282.1, "r_y0": 266.2, "r_x1": 289.3, "r_y1": 266.2, "r_x2": 289.3, "r_y2": 256.9, "r_x3": 282.1, "r_y3": 256.9, "coord_origin": "TOPLEFT" }, "text": "U", "orig": "U", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 70, "label": "text", "bbox": { "l": 282.4, "t": 269.1, "r": 289.6, "b": 278.5, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 38, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 282.4, "r_y0": 278.5, "r_x1": 289.6, "r_y1": 278.5, "r_x2": 289.6, "r_y2": 269.1, "r_x3": 282.4, "r_y3": 269.1, "coord_origin": "TOPLEFT" }, "text": "U", "orig": "U", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 71, "label": "text", "bbox": { "l": 295.5, "t": 244.5, "r": 301.1, "b": 253.8, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 39, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 295.5, "r_y0": 253.8, "r_x1": 301.1, "r_y1": 253.8, "r_x2": 301.1, "r_y2": 244.5, "r_x3": 295.5, "r_y3": 244.5, "coord_origin": "TOPLEFT" }, "text": "L", "orig": "L", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 72, "label": "text", "bbox": { "l": 307.5, "t": 244.6, "r": 313.0, "b": 253.9, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 40, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 307.5, "r_y0": 253.9, "r_x1": 313.0, "r_y1": 253.9, "r_x2": 313.0, "r_y2": 244.6, "r_x3": 307.5, "r_y3": 244.6, "coord_origin": "TOPLEFT" }, "text": "L", "orig": "L", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 73, "label": "text", "bbox": { "l": 318.8, "t": 244.4, "r": 324.3, "b": 253.8, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 41, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 318.8, "r_y0": 253.8, "r_x1": 324.3, "r_y1": 253.8, "r_x2": 324.3, "r_y2": 244.4, "r_x3": 318.8, "r_y3": 244.4, "coord_origin": "TOPLEFT" }, "text": "L", "orig": "L", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 74, "label": "text", "bbox": { "l": 294.9, "t": 256.7, "r": 301.0, "b": 266.0, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 42, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 294.9, "r_y0": 266.0, "r_x1": 301.0, "r_y1": 266.0, "r_x2": 301.0, "r_y2": 256.7, "r_x3": 294.9, "r_y3": 256.7, "coord_origin": "TOPLEFT" }, "text": "X", "orig": "X", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 75, "label": "text", "bbox": { "l": 307.2, "t": 256.7, "r": 325.6, "b": 266.0, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 43, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 307.2, "r_y0": 266.0, "r_x1": 325.6, "r_y1": 266.0, "r_x2": 325.6, "r_y2": 256.7, "r_x3": 307.2, "r_y3": 256.7, "coord_origin": "TOPLEFT" }, "text": "X X", "orig": "X X", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 76, "label": "text", "bbox": { "l": 294.8, "t": 269.3, "r": 300.9, "b": 278.6, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 44, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 294.8, "r_y0": 278.6, "r_x1": 300.9, "r_y1": 278.6, "r_x2": 300.9, "r_y2": 269.3, "r_x3": 294.8, "r_y3": 269.3, "coord_origin": "TOPLEFT" }, "text": "X", "orig": "X", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 77, "label": "text", "bbox": { "l": 307.1, "t": 269.3, "r": 325.5, "b": 278.6, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 45, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 307.1, "r_y0": 278.6, "r_x1": 325.5, "r_y1": 278.6, "r_x2": 325.5, "r_y2": 269.3, "r_x3": 307.1, "r_y3": 269.3, "coord_origin": "TOPLEFT" }, "text": "X X", "orig": "X X", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 78, "label": "text", "bbox": { "l": 195.9, "t": 268.7, "r": 203.1, "b": 278.1, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 46, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 195.9, "r_y0": 278.1, "r_x1": 203.1, "r_y1": 278.1, "r_x2": 203.1, "r_y2": 268.7, "r_x3": 195.9, "r_y3": 268.7, "coord_origin": "TOPLEFT" }, "text": "C", "orig": "C", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 79, "label": "text", "bbox": { "l": 209.2, "t": 268.7, "r": 214.7, "b": 278.1, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 47, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 209.2, "r_y0": 278.1, "r_x1": 214.7, "r_y1": 278.1, "r_x2": 214.7, "r_y2": 268.7, "r_x3": 209.2, "r_y3": 268.7, "coord_origin": "TOPLEFT" }, "text": "L", "orig": "L", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 80, "label": "text", "bbox": { "l": 221.1, "t": 268.8, "r": 226.7, "b": 278.1, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 48, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 221.1, "r_y0": 278.1, "r_x1": 226.7, "r_y1": 278.1, "r_x2": 226.7, "r_y2": 268.8, "r_x3": 221.1, "r_y3": 268.8, "coord_origin": "TOPLEFT" }, "text": "L", "orig": "L", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 81, "label": "text", "bbox": { "l": 232.4, "t": 268.7, "r": 238.0, "b": 278.0, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 49, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 232.4, "r_y0": 278.0, "r_x1": 238.0, "r_y1": 278.0, "r_x2": 238.0, "r_y2": 268.7, "r_x3": 232.4, "r_y3": 268.7, "coord_origin": "TOPLEFT" }, "text": "L", "orig": "L", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 82, "label": "text", "bbox": { "l": 196.2, "t": 244.5, "r": 203.4, "b": 253.9, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 50, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 196.2, "r_y0": 253.9, "r_x1": 203.4, "r_y1": 253.9, "r_x2": 203.4, "r_y2": 244.5, "r_x3": 196.2, "r_y3": 244.5, "coord_origin": "TOPLEFT" }, "text": "C", "orig": "C", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 83, "label": "text", "bbox": { "l": 250.3, "t": 244.1, "r": 257.5, "b": 253.4, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 51, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 250.3, "r_y0": 253.4, "r_x1": 257.5, "r_y1": 253.4, "r_x2": 257.5, "r_y2": 244.1, "r_x3": 250.3, "r_y3": 244.1, "coord_origin": "TOPLEFT" }, "text": "C", "orig": "C", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 84, "label": "text", "bbox": { "l": 250.2, "t": 256.4, "r": 257.3, "b": 265.8, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 52, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 250.2, "r_y0": 265.8, "r_x1": 257.3, "r_y1": 265.8, "r_x2": 257.3, "r_y2": 256.4, "r_x3": 250.2, "r_y3": 256.4, "coord_origin": "TOPLEFT" }, "text": "U", "orig": "U", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 85, "label": "text", "bbox": { "l": 250.5, "t": 268.7, "r": 257.6, "b": 278.0, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 53, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 250.5, "r_y0": 278.0, "r_x1": 257.6, "r_y1": 278.0, "r_x2": 257.6, "r_y2": 268.7, "r_x3": 250.5, "r_y3": 268.7, "coord_origin": "TOPLEFT" }, "text": "U", "orig": "U", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 86, "label": "text", "bbox": { "l": 334.5, "t": 243.0, "r": 337.2, "b": 249.2, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 54, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 334.5, "r_y0": 249.2, "r_x1": 337.2, "r_y1": 249.2, "r_x2": 337.2, "r_y2": 243.0, "r_x3": 334.5, "r_y3": 243.0, "coord_origin": "TOPLEFT" }, "text": "1", "orig": "1", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 87, "label": "text", "bbox": { "l": 339.9, "t": 243.0, "r": 391.5, "b": 249.2, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 55, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 339.9, "r_y0": 249.2, "r_x1": 391.5, "r_y1": 249.2, "r_x2": 391.5, "r_y2": 243.0, "r_x3": 339.9, "r_y3": 243.0, "coord_origin": "TOPLEFT" }, "text": "- simple cells: \"C\"", "orig": "- simple cells: \"C\"", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 88, "label": "text", "bbox": { "l": 334.5, "t": 252.9, "r": 337.3, "b": 259.1, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 56, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 334.5, "r_y0": 259.1, "r_x1": 337.3, "r_y1": 259.1, "r_x2": 337.3, "r_y2": 252.9, "r_x3": 334.5, "r_y3": 252.9, "coord_origin": "TOPLEFT" }, "text": "2", "orig": "2", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 89, "label": "text", "bbox": { "l": 340.2, "t": 252.9, "r": 422.0, "b": 259.1, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 57, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 340.2, "r_y0": 259.1, "r_x1": 422.0, "r_y1": 259.1, "r_x2": 422.0, "r_y2": 252.9, "r_x3": 340.2, "r_y3": 252.9, "coord_origin": "TOPLEFT" }, "text": "- horizontal merges: \"C\", \"L\"", "orig": "- horizontal merges: \"C\", \"L\"", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 90, "label": "text", "bbox": { "l": 334.5, "t": 262.9, "r": 337.3, "b": 269.1, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 58, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 334.5, "r_y0": 269.1, "r_x1": 337.3, "r_y1": 269.1, "r_x2": 337.3, "r_y2": 262.9, "r_x3": 334.5, "r_y3": 262.9, "coord_origin": "TOPLEFT" }, "text": "3", "orig": "3", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 91, "label": "text", "bbox": { "l": 340.1, "t": 262.9, "r": 415.3, "b": 269.1, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 59, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 340.1, "r_y0": 269.1, "r_x1": 415.3, "r_y1": 269.1, "r_x2": 415.3, "r_y2": 262.9, "r_x3": 340.1, "r_y3": 262.9, "coord_origin": "TOPLEFT" }, "text": "- vertical merges: \"C\", \"U\"", "orig": "- vertical merges: \"C\", \"U\"", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 18, "label": "list_item", "bbox": { "l": 334.5, "t": 272.8, "r": 426.6, "b": 279.0, "coord_origin": "TOPLEFT" }, "confidence": 0.53, "cells": [ { "index": 60, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 334.5, "r_y0": 279.0, "r_x1": 337.3, "r_y1": 279.0, "r_x2": 337.3, "r_y2": 272.8, "r_x3": 334.5, "r_y3": 272.8, "coord_origin": "TOPLEFT" }, "text": "4", "orig": "4", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 61, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 340.1, "r_y0": 279.0, "r_x1": 426.6, "r_y1": 279.0, "r_x2": 426.6, "r_y2": 272.8, "r_x3": 340.1, "r_y3": 272.8, "coord_origin": "TOPLEFT" }, "text": "- 2d merges: \"C\", \"L\", \"U\", \"X\"", "orig": "- 2d merges: \"C\", \"L\", \"U\", \"X\"", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 92, "label": "text", "bbox": { "l": 185.7, "t": 244.0, "r": 189.4, "b": 250.3, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 62, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 185.7, "r_y0": 250.3, "r_x1": 189.4, "r_y1": 250.3, "r_x2": 189.4, "r_y2": 244.0, "r_x3": 185.7, "r_y3": 244.0, "coord_origin": "TOPLEFT" }, "text": "1", "orig": "1", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 93, "label": "text", "bbox": { "l": 186.0, "t": 268.3, "r": 189.7, "b": 274.6, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 63, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 186.0, "r_y0": 274.6, "r_x1": 189.7, "r_y1": 274.6, "r_x2": 189.7, "r_y2": 268.3, "r_x3": 186.0, "r_y3": 268.3, "coord_origin": "TOPLEFT" }, "text": "2", "orig": "2", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 94, "label": "text", "bbox": { "l": 239.3, "t": 243.6, "r": 243.0, "b": 249.8, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 64, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 239.3, "r_y0": 249.8, "r_x1": 243.0, "r_y1": 249.8, "r_x2": 243.0, "r_y2": 243.6, "r_x3": 239.3, "r_y3": 243.6, "coord_origin": "TOPLEFT" }, "text": "3", "orig": "3", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 95, "label": "text", "bbox": { "l": 271.3, "t": 243.5, "r": 275.0, "b": 249.7, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 65, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 271.3, "r_y0": 249.7, "r_x1": 275.0, "r_y1": 249.7, "r_x2": 275.0, "r_y2": 243.5, "r_x3": 271.3, "r_y3": 243.5, "coord_origin": "TOPLEFT" }, "text": "4", "orig": "4", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 96, "label": "text", "bbox": { "l": 229.8, "t": 166.5, "r": 233.5, "b": 172.7, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 66, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 229.8, "r_y0": 172.7, "r_x1": 233.5, "r_y1": 172.7, "r_x2": 233.5, "r_y2": 166.5, "r_x3": 229.8, "r_y3": 166.5, "coord_origin": "TOPLEFT" }, "text": "2", "orig": "2", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 97, "label": "text", "bbox": { "l": 257.2, "t": 190.0, "r": 260.9, "b": 196.2, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 67, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 257.2, "r_y0": 196.2, "r_x1": 260.9, "r_y1": 196.2, "r_x2": 260.9, "r_y2": 190.0, "r_x3": 257.2, "r_y3": 190.0, "coord_origin": "TOPLEFT" }, "text": "1", "orig": "1", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 98, "label": "text", "bbox": { "l": 186.9, "t": 178.0, "r": 190.6, "b": 184.2, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 68, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 186.9, "r_y0": 184.2, "r_x1": 190.6, "r_y1": 184.2, "r_x2": 190.6, "r_y2": 178.0, "r_x3": 186.9, "r_y3": 178.0, "coord_origin": "TOPLEFT" }, "text": "3", "orig": "3", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 99, "label": "text", "bbox": { "l": 196.5, "t": 169.0, "r": 200.2, "b": 175.2, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 69, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 196.5, "r_y0": 175.2, "r_x1": 200.2, "r_y1": 175.2, "r_x2": 200.2, "r_y2": 169.0, "r_x3": 196.5, "r_y3": 169.0, "coord_origin": "TOPLEFT" }, "text": "4", "orig": "4", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 100, "label": "text", "bbox": { "l": 169.7, "t": 167.9, "r": 175.7, "b": 175.7, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 70, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 169.7, "r_y0": 175.7, "r_x1": 175.7, "r_y1": 175.7, "r_x2": 175.7, "r_y2": 167.9, "r_x3": 169.7, "r_y3": 167.9, "coord_origin": "TOPLEFT" }, "text": "A", "orig": "A", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 101, "label": "text", "bbox": { "l": 169.7, "t": 206.8, "r": 175.7, "b": 214.6, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 71, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 169.7, "r_y0": 214.6, "r_x1": 175.7, "r_y1": 214.6, "r_x2": 175.7, "r_y2": 206.8, "r_x3": 169.7, "r_y3": 206.8, "coord_origin": "TOPLEFT" }, "text": "B", "orig": "B", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 102, "label": "text", "bbox": { "l": 274.3, "t": 168.3, "r": 280.3, "b": 176.0, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 72, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 274.3, "r_y0": 176.0, "r_x1": 280.3, "r_y1": 176.0, "r_x2": 280.3, "r_y2": 168.3, "r_x3": 274.3, "r_y3": 168.3, "coord_origin": "TOPLEFT" }, "text": "C", "orig": "C", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 103, "label": "text", "bbox": { "l": 359.6, "t": 168.3, "r": 365.5, "b": 176.0, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 73, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 359.6, "r_y0": 176.0, "r_x1": 365.5, "r_y1": 176.0, "r_x2": 365.5, "r_y2": 168.3, "r_x3": 359.6, "r_y3": 168.3, "coord_origin": "TOPLEFT" }, "text": "D", "orig": "D", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 104, "label": "text", "bbox": { "l": 169.7, "t": 243.2, "r": 175.3, "b": 251.0, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 74, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 169.7, "r_y0": 251.0, "r_x1": 175.3, "r_y1": 251.0, "r_x2": 175.3, "r_y2": 243.2, "r_x3": 169.7, "r_y3": 243.2, "coord_origin": "TOPLEFT" }, "text": "E", "orig": "E", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] } ] }, "text": "", "annotations": [], "provenance": null, "predicted_class": null, "confidence": null }, { "label": "section_header", "id": 9, "page_no": 6, "cluster": { "id": 9, "label": "section_header", "bbox": { "l": 134.8, "t": 305.3, "r": 246.7, "b": 314.1, "coord_origin": "TOPLEFT" }, "confidence": 0.92, "cells": [ { "index": 75, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 134.8, "r_y0": 314.1, "r_x1": 149.4, "r_y1": 314.1, "r_x2": 149.4, "r_y2": 305.3, "r_x3": 134.8, "r_y3": 305.3, "coord_origin": "TOPLEFT" }, "text": "4.2", "orig": "4.2", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 76, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 160.9, "r_y0": 314.1, "r_x1": 246.7, "r_y1": 314.1, "r_x2": 246.7, "r_y2": 305.3, "r_x3": 160.9, "r_y3": 305.3, "coord_origin": "TOPLEFT" }, "text": "Language Syntax", "orig": "Language Syntax", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, "text": "4.2 Language Syntax" }, { "label": "text", "id": 10, "page_no": 6, "cluster": { "id": 10, "label": "text", "bbox": { "l": 134.8, "t": 325.2, "r": 363.8, "b": 334.0, "coord_origin": "TOPLEFT" }, "confidence": 0.92, "cells": [ { "index": 77, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 134.8, "r_y0": 334.0, "r_x1": 363.8, "r_y1": 334.0, "r_x2": 363.8, "r_y2": 325.2, "r_x3": 134.8, "r_y3": 325.2, "coord_origin": "TOPLEFT" }, "text": "The OTSL representation follows these syntax rules:", "orig": "The OTSL representation follows these syntax rules:", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, "text": "The OTSL representation follows these syntax rules:" }, { "label": "list_item", "id": 3, "page_no": 6, "cluster": { "id": 3, "label": "list_item", "bbox": { "l": 139.0, "t": 347.2, "r": 480.6, "b": 367.9, "coord_origin": "TOPLEFT" }, "confidence": 0.96, "cells": [ { "index": 78, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 139.0, "r_y0": 356.0, "r_x1": 146.7, "r_y1": 356.0, "r_x2": 146.7, "r_y2": 347.2, "r_x3": 139.0, "r_y3": 347.2, "coord_origin": "TOPLEFT" }, "text": "1.", "orig": "1.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 79, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 151.7, "r_y0": 356.0, "r_x1": 257.4, "r_y1": 356.0, "r_x2": 257.4, "r_y2": 347.2, "r_x3": 151.7, "r_y3": 347.2, "coord_origin": "TOPLEFT" }, "text": "Left-looking cell rule", "orig": "Left-looking cell rule", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 80, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 257.4, "r_y0": 356.0, "r_x1": 480.6, "r_y1": 356.0, "r_x2": 480.6, "r_y2": 347.2, "r_x3": 257.4, "r_y3": 347.2, "coord_origin": "TOPLEFT" }, "text": ": The left neighbour of an \"L\" cell must be either", "orig": ": The left neighbour of an \"L\" cell must be either", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 81, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 151.7, "r_y0": 367.9, "r_x1": 283.6, "r_y1": 367.9, "r_x2": 283.6, "r_y2": 359.1, "r_x3": 151.7, "r_y3": 359.1, "coord_origin": "TOPLEFT" }, "text": "another \"L\" cell or a \"C\" cell.", "orig": "another \"L\" cell or a \"C\" cell.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, "text": "1. Left-looking cell rule : The left neighbour of an \"L\" cell must be either another \"L\" cell or a \"C\" cell." }, { "label": "list_item", "id": 4, "page_no": 6, "cluster": { "id": 4, "label": "list_item", "bbox": { "l": 139.0, "t": 371.1, "r": 480.6, "b": 391.8, "coord_origin": "TOPLEFT" }, "confidence": 0.96, "cells": [ { "index": 82, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 139.0, "r_y0": 379.9, "r_x1": 146.7, "r_y1": 379.9, "r_x2": 146.7, "r_y2": 371.1, "r_x3": 139.0, "r_y3": 371.1, "coord_origin": "TOPLEFT" }, "text": "2.", "orig": "2.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 83, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 151.7, "r_y0": 379.9, "r_x1": 252.1, "r_y1": 379.9, "r_x2": 252.1, "r_y2": 371.1, "r_x3": 151.7, "r_y3": 371.1, "coord_origin": "TOPLEFT" }, "text": "Up-looking cell rule", "orig": "Up-looking cell rule", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 84, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 252.1, "r_y0": 379.9, "r_x1": 480.6, "r_y1": 379.9, "r_x2": 480.6, "r_y2": 371.1, "r_x3": 252.1, "r_y3": 371.1, "coord_origin": "TOPLEFT" }, "text": ": The upper neighbour of a \"U\" cell must be either", "orig": ": The upper neighbour of a \"U\" cell must be either", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 85, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 151.7, "r_y0": 391.8, "r_x1": 284.8, "r_y1": 391.8, "r_x2": 284.8, "r_y2": 383.0, "r_x3": 151.7, "r_y3": 383.0, "coord_origin": "TOPLEFT" }, "text": "another \"U\" cell or a \"C\" cell.", "orig": "another \"U\" cell or a \"C\" cell.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, "text": "2. Up-looking cell rule : The upper neighbour of a \"U\" cell must be either another \"U\" cell or a \"C\" cell." }, { "label": "section_header", "id": 14, "page_no": 6, "cluster": { "id": 14, "label": "section_header", "bbox": { "l": 139.0, "t": 395.0, "r": 226.1, "b": 403.8, "coord_origin": "TOPLEFT" }, "confidence": 0.65, "cells": [ { "index": 86, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 139.0, "r_y0": 403.8, "r_x1": 146.7, "r_y1": 403.8, "r_x2": 146.7, "r_y2": 395.0, "r_x3": 139.0, "r_y3": 395.0, "coord_origin": "TOPLEFT" }, "text": "3.", "orig": "3.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 87, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 151.7, "r_y0": 403.8, "r_x1": 223.3, "r_y1": 403.8, "r_x2": 223.3, "r_y2": 395.0, "r_x3": 151.7, "r_y3": 395.0, "coord_origin": "TOPLEFT" }, "text": "Cross cell rule", "orig": "Cross cell rule", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 88, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 223.3, "r_y0": 403.8, "r_x1": 226.1, "r_y1": 403.8, "r_x2": 226.1, "r_y2": 395.0, "r_x3": 223.3, "r_y3": 395.0, "coord_origin": "TOPLEFT" }, "text": ":", "orig": ":", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, "text": "3. Cross cell rule :" }, { "label": "list_item", "id": 13, "page_no": 6, "cluster": { "id": 13, "label": "list_item", "bbox": { "l": 151.7, "t": 407.0, "r": 480.6, "b": 439.7, "coord_origin": "TOPLEFT" }, "confidence": 0.72, "cells": [ { "index": 89, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 151.7, "r_y0": 415.8, "r_x1": 480.6, "r_y1": 415.8, "r_x2": 480.6, "r_y2": 407.0, "r_x3": 151.7, "r_y3": 407.0, "coord_origin": "TOPLEFT" }, "text": "The left neighbour of an \"X\" cell must be either another \"X\" cell or a \"U\"", "orig": "The left neighbour of an \"X\" cell must be either another \"X\" cell or a \"U\"", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 90, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 151.7, "r_y0": 427.7, "r_x1": 480.6, "r_y1": 427.7, "r_x2": 480.6, "r_y2": 418.9, "r_x3": 151.7, "r_y3": 418.9, "coord_origin": "TOPLEFT" }, "text": "cell, and the upper neighbour of an \"X\" cell must be either another \"X\" cell", "orig": "cell, and the upper neighbour of an \"X\" cell must be either another \"X\" cell", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 91, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 151.7, "r_y0": 439.7, "r_x1": 214.4, "r_y1": 439.7, "r_x2": 214.4, "r_y2": 430.9, "r_x3": 151.7, "r_y3": 430.9, "coord_origin": "TOPLEFT" }, "text": "or an \"L\" cell.", "orig": "or an \"L\" cell.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, "text": "The left neighbour of an \"X\" cell must be either another \"X\" cell or a \"U\" cell, and the upper neighbour of an \"X\" cell must be either another \"X\" cell or an \"L\" cell." }, { "label": "list_item", "id": 8, "page_no": 6, "cluster": { "id": 8, "label": "list_item", "bbox": { "l": 139.0, "t": 442.8, "r": 474.6, "b": 451.6, "coord_origin": "TOPLEFT" }, "confidence": 0.93, "cells": [ { "index": 92, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 139.0, "r_y0": 451.6, "r_x1": 146.7, "r_y1": 451.6, "r_x2": 146.7, "r_y2": 442.8, "r_x3": 139.0, "r_y3": 442.8, "coord_origin": "TOPLEFT" }, "text": "4.", "orig": "4.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 93, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 151.7, "r_y0": 451.6, "r_x1": 221.3, "r_y1": 451.6, "r_x2": 221.3, "r_y2": 442.8, "r_x3": 151.7, "r_y3": 442.8, "coord_origin": "TOPLEFT" }, "text": "First row rule", "orig": "First row rule", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 94, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 221.3, "r_y0": 451.6, "r_x1": 474.6, "r_y1": 451.6, "r_x2": 474.6, "r_y2": 442.8, "r_x3": 221.3, "r_y3": 442.8, "coord_origin": "TOPLEFT" }, "text": ": Only \"L\" cells and \"C\" cells are allowed in the first row.", "orig": ": Only \"L\" cells and \"C\" cells are allowed in the first row.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, "text": "4. First row rule : Only \"L\" cells and \"C\" cells are allowed in the first row." }, { "label": "list_item", "id": 5, "page_no": 6, "cluster": { "id": 5, "label": "list_item", "bbox": { "l": 139.0, "t": 454.8, "r": 480.6, "b": 475.5, "coord_origin": "TOPLEFT" }, "confidence": 0.94, "cells": [ { "index": 95, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 139.0, "r_y0": 463.6, "r_x1": 146.7, "r_y1": 463.6, "r_x2": 146.7, "r_y2": 454.8, "r_x3": 139.0, "r_y3": 454.8, "coord_origin": "TOPLEFT" }, "text": "5.", "orig": "5.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 96, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 151.7, "r_y0": 463.6, "r_x1": 240.7, "r_y1": 463.6, "r_x2": 240.7, "r_y2": 454.8, "r_x3": 151.7, "r_y3": 454.8, "coord_origin": "TOPLEFT" }, "text": "First column rule", "orig": "First column rule", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 97, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 240.7, "r_y0": 463.6, "r_x1": 480.6, "r_y1": 463.6, "r_x2": 480.6, "r_y2": 454.8, "r_x3": 240.7, "r_y3": 454.8, "coord_origin": "TOPLEFT" }, "text": ": Only \"U\" cells and \"C\" cells are allowed in the first", "orig": ": Only \"U\" cells and \"C\" cells are allowed in the first", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 98, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 151.7, "r_y0": 475.5, "r_x1": 186.0, "r_y1": 475.5, "r_x2": 186.0, "r_y2": 466.7, "r_x3": 151.7, "r_y3": 466.7, "coord_origin": "TOPLEFT" }, "text": "column.", "orig": "column.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, "text": "5. First column rule : Only \"U\" cells and \"C\" cells are allowed in the first column." }, { "label": "list_item", "id": 1, "page_no": 6, "cluster": { "id": 1, "label": "list_item", "bbox": { "l": 139.0, "t": 478.7, "r": 480.6, "b": 499.5, "coord_origin": "TOPLEFT" }, "confidence": 0.96, "cells": [ { "index": 99, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 139.0, "r_y0": 487.5, "r_x1": 146.7, "r_y1": 487.5, "r_x2": 146.7, "r_y2": 478.7, "r_x3": 139.0, "r_y3": 478.7, "coord_origin": "TOPLEFT" }, "text": "6.", "orig": "6.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 100, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 151.7, "r_y0": 487.5, "r_x1": 235.2, "r_y1": 487.5, "r_x2": 235.2, "r_y2": 478.7, "r_x3": 151.7, "r_y3": 478.7, "coord_origin": "TOPLEFT" }, "text": "Rectangular rule", "orig": "Rectangular rule", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 101, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 235.2, "r_y0": 487.5, "r_x1": 480.6, "r_y1": 487.5, "r_x2": 480.6, "r_y2": 478.7, "r_x3": 235.2, "r_y3": 478.7, "coord_origin": "TOPLEFT" }, "text": ": The table representation is always rectangular - all rows", "orig": ": The table representation is always rectangular - all rows", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 102, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 151.7, "r_y0": 499.5, "r_x1": 448.0, "r_y1": 499.5, "r_x2": 448.0, "r_y2": 490.7, "r_x3": 151.7, "r_y3": 490.7, "coord_origin": "TOPLEFT" }, "text": "must have an equal number of tokens, terminated with \"NL\" token.", "orig": "must have an equal number of tokens, terminated with \"NL\" token.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, "text": "6. Rectangular rule : The table representation is always rectangular - all rows must have an equal number of tokens, terminated with \"NL\" token." }, { "label": "text", "id": 0, "page_no": 6, "cluster": { "id": 0, "label": "text", "bbox": { "l": 134.8, "t": 512.6, "r": 480.6, "b": 640.9, "coord_origin": "TOPLEFT" }, "confidence": 0.98, "cells": [ { "index": 103, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 149.7, "r_y0": 521.4, "r_x1": 480.6, "r_y1": 521.4, "r_x2": 480.6, "r_y2": 512.6, "r_x3": 149.7, "r_y3": 512.6, "coord_origin": "TOPLEFT" }, "text": "The application of these rules gives OTSL a set of unique properties. First", "orig": "The application of these rules gives OTSL a set of unique properties. First", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 104, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 134.8, "r_y0": 533.3, "r_x1": 480.6, "r_y1": 533.3, "r_x2": 480.6, "r_y2": 524.5, "r_x3": 134.8, "r_y3": 524.5, "coord_origin": "TOPLEFT" }, "text": "of all, the OTSL enforces a strictly rectangular structure representation, where", "orig": "of all, the OTSL enforces a strictly rectangular structure representation, where", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 105, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 134.8, "r_y0": 545.3, "r_x1": 480.6, "r_y1": 545.3, "r_x2": 480.6, "r_y2": 536.5, "r_x3": 134.8, "r_y3": 536.5, "coord_origin": "TOPLEFT" }, "text": "every new-line token starts a new row. As a consequence, all rows and all columns", "orig": "every new-line token starts a new row. As a consequence, all rows and all columns", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 106, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 134.8, "r_y0": 557.3, "r_x1": 480.6, "r_y1": 557.3, "r_x2": 480.6, "r_y2": 548.5, "r_x3": 134.8, "r_y3": 548.5, "coord_origin": "TOPLEFT" }, "text": "have exactly the same number of tokens, irrespective of cell spans. Secondly, the", "orig": "have exactly the same number of tokens, irrespective of cell spans. Secondly, the", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 107, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 134.8, "r_y0": 569.2, "r_x1": 480.6, "r_y1": 569.2, "r_x2": 480.6, "r_y2": 560.4, "r_x3": 134.8, "r_y3": 560.4, "coord_origin": "TOPLEFT" }, "text": "OTSL representation is unambiguous: Every table structure is represented in one", "orig": "OTSL representation is unambiguous: Every table structure is represented in one", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 108, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 134.8, "r_y0": 581.2, "r_x1": 480.6, "r_y1": 581.2, "r_x2": 480.6, "r_y2": 572.4, "r_x3": 134.8, "r_y3": 572.4, "coord_origin": "TOPLEFT" }, "text": "way. In this representation every table cell corresponds to a \"C\"-cell token, which", "orig": "way. In this representation every table cell corresponds to a \"C\"-cell token, which", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 109, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 134.8, "r_y0": 593.1, "r_x1": 480.6, "r_y1": 593.1, "r_x2": 480.6, "r_y2": 584.3, "r_x3": 134.8, "r_y3": 584.3, "coord_origin": "TOPLEFT" }, "text": "in case of spans is always located in the top-left corner of the table cell definition.", "orig": "in case of spans is always located in the top-left corner of the table cell definition.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 110, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 134.8, "r_y0": 605.1, "r_x1": 480.6, "r_y1": 605.1, "r_x2": 480.6, "r_y2": 596.3, "r_x3": 134.8, "r_y3": 596.3, "coord_origin": "TOPLEFT" }, "text": "Third, OTSL syntax rules are only backward-looking. As a consequence, every", "orig": "Third, OTSL syntax rules are only backward-looking. As a consequence, every", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 111, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 134.8, "r_y0": 617.0, "r_x1": 480.6, "r_y1": 617.0, "r_x2": 480.6, "r_y2": 608.2, "r_x3": 134.8, "r_y3": 608.2, "coord_origin": "TOPLEFT" }, "text": "predicted token can be validated straight during sequence generation by looking", "orig": "predicted token can be validated straight during sequence generation by looking", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 112, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 134.8, "r_y0": 629.0, "r_x1": 480.6, "r_y1": 629.0, "r_x2": 480.6, "r_y2": 620.2, "r_x3": 134.8, "r_y3": 620.2, "coord_origin": "TOPLEFT" }, "text": "at the previously predicted sequence. As such, OTSL can guarantee that every", "orig": "at the previously predicted sequence. As such, OTSL can guarantee that every", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 113, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 134.8, "r_y0": 640.9, "r_x1": 311.2, "r_y1": 640.9, "r_x2": 311.2, "r_y2": 632.1, "r_x3": 134.8, "r_y3": 632.1, "coord_origin": "TOPLEFT" }, "text": "predicted sequence is syntactically valid.", "orig": "predicted sequence is syntactically valid.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, "text": "The application of these rules gives OTSL a set of unique properties. First of all, the OTSL enforces a strictly rectangular structure representation, where every new-line token starts a new row. As a consequence, all rows and all columns have exactly the same number of tokens, irrespective of cell spans. Secondly, the OTSL representation is unambiguous: Every table structure is represented in one way. In this representation every table cell corresponds to a \"C\"-cell token, which in case of spans is always located in the top-left corner of the table cell definition. Third, OTSL syntax rules are only backward-looking. As a consequence, every predicted token can be validated straight during sequence generation by looking at the previously predicted sequence. As such, OTSL can guarantee that every predicted sequence is syntactically valid." }, { "label": "text", "id": 2, "page_no": 6, "cluster": { "id": 2, "label": "text", "bbox": { "l": 134.8, "t": 644.1, "r": 480.6, "b": 664.9, "coord_origin": "TOPLEFT" }, "confidence": 0.96, "cells": [ { "index": 114, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 149.7, "r_y0": 652.9, "r_x1": 480.6, "r_y1": 652.9, "r_x2": 480.6, "r_y2": 644.1, "r_x3": 149.7, "r_y3": 644.1, "coord_origin": "TOPLEFT" }, "text": "These characteristics can be easily learned by sequence generator networks,", "orig": "These characteristics can be easily learned by sequence generator networks,", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 115, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 134.8, "r_y0": 664.9, "r_x1": 480.6, "r_y1": 664.9, "r_x2": 480.6, "r_y2": 656.1, "r_x3": 134.8, "r_y3": 656.1, "coord_origin": "TOPLEFT" }, "text": "as we demonstrate further below. We find strong indications that this pattern", "orig": "as we demonstrate further below. We find strong indications that this pattern", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, "text": "These characteristics can be easily learned by sequence generator networks, as we demonstrate further below. We find strong indications that this pattern" } ], "body": [ { "label": "caption", "id": 6, "page_no": 6, "cluster": { "id": 6, "label": "caption", "bbox": { "l": 134.8, "t": 125.8, "r": 480.6, "b": 155.8, "coord_origin": "TOPLEFT" }, "confidence": 0.93, "cells": [ { "index": 2, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 134.8, "r_y0": 133.7, "r_x1": 162.6, "r_y1": 133.7, "r_x2": 162.6, "r_y2": 125.8, "r_x3": 134.8, "r_y3": 125.8, "coord_origin": "TOPLEFT" }, "text": "Fig. 3.", "orig": "Fig. 3.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 3, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 166.3, "r_y0": 133.9, "r_x1": 480.6, "r_y1": 133.9, "r_x2": 480.6, "r_y2": 125.9, "r_x3": 166.3, "r_y3": 125.9, "coord_origin": "TOPLEFT" }, "text": "OTSL description of table structure: A - table example; B - graphical repre-", "orig": "OTSL description of table structure: A - table example; B - graphical repre-", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 4, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 134.8, "r_y0": 144.9, "r_x1": 480.6, "r_y1": 144.9, "r_x2": 480.6, "r_y2": 136.8, "r_x3": 134.8, "r_y3": 136.8, "coord_origin": "TOPLEFT" }, "text": "sentation of table structure; C - mapping structure on a grid; D - OTSL structure", "orig": "sentation of table structure; C - mapping structure on a grid; D - OTSL structure", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 5, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 134.8, "r_y0": 155.8, "r_x1": 306.1, "r_y1": 155.8, "r_x2": 306.1, "r_y2": 147.8, "r_x3": 134.8, "r_y3": 147.8, "coord_origin": "TOPLEFT" }, "text": "encoding; E - explanation on cell encoding", "orig": "encoding; E - explanation on cell encoding", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, "text": "Fig. 3. OTSL description of table structure: A - table example; B - graphical representation of table structure; C - mapping structure on a grid; D - OTSL structure encoding; E - explanation on cell encoding" }, { "label": "picture", "id": 12, "page_no": 6, "cluster": { "id": 12, "label": "picture", "bbox": { "l": 164.7, "t": 163.8, "r": 449.6, "b": 280.3, "coord_origin": "TOPLEFT" }, "confidence": 0.79, "cells": [ { "index": 6, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 374.5, "r_y0": 177.9, "r_x1": 381.7, "r_y1": 177.9, "r_x2": 381.7, "r_y2": 168.6, "r_x3": 374.5, "r_y3": 168.6, "coord_origin": "TOPLEFT" }, "text": "C", "orig": "C", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 7, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 398.7, "r_y0": 177.8, "r_x1": 405.9, "r_y1": 177.8, "r_x2": 405.9, "r_y2": 168.5, "r_x3": 398.7, "r_y3": 168.5, "coord_origin": "TOPLEFT" }, "text": "C", "orig": "C", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 8, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 373.8, "r_y0": 202.2, "r_x1": 380.9, "r_y1": 202.2, "r_x2": 380.9, "r_y2": 192.9, "r_x3": 373.8, "r_y3": 192.9, "coord_origin": "TOPLEFT" }, "text": "C", "orig": "C", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 9, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 386.7, "r_y0": 202.4, "r_x1": 393.8, "r_y1": 202.4, "r_x2": 393.8, "r_y2": 193.1, "r_x3": 386.7, "r_y3": 193.1, "coord_origin": "TOPLEFT" }, "text": "C", "orig": "C", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 10, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 386.7, "r_y0": 214.5, "r_x1": 393.9, "r_y1": 214.5, "r_x2": 393.9, "r_y2": 205.1, "r_x3": 386.7, "r_y3": 205.1, "coord_origin": "TOPLEFT" }, "text": "C", "orig": "C", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 11, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 398.7, "r_y0": 190.1, "r_x1": 405.8, "r_y1": 190.1, "r_x2": 405.8, "r_y2": 180.7, "r_x3": 398.7, "r_y3": 180.7, "coord_origin": "TOPLEFT" }, "text": "C", "orig": "C", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 12, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 410.8, "r_y0": 190.1, "r_x1": 418.0, "r_y1": 190.1, "r_x2": 418.0, "r_y2": 180.7, "r_x3": 410.8, "r_y3": 180.7, "coord_origin": "TOPLEFT" }, "text": "C", "orig": "C", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 13, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 422.9, "r_y0": 190.0, "r_x1": 430.1, "r_y1": 190.0, "r_x2": 430.1, "r_y2": 180.7, "r_x3": 422.9, "r_y3": 180.7, "coord_origin": "TOPLEFT" }, "text": "C", "orig": "C", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 14, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 398.8, "r_y0": 202.3, "r_x1": 406.0, "r_y1": 202.3, "r_x2": 406.0, "r_y2": 193.0, "r_x3": 398.8, "r_y3": 193.0, "coord_origin": "TOPLEFT" }, "text": "C", "orig": "C", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 15, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 410.9, "r_y0": 202.3, "r_x1": 418.1, "r_y1": 202.3, "r_x2": 418.1, "r_y2": 193.0, "r_x3": 410.9, "r_y3": 193.0, "coord_origin": "TOPLEFT" }, "text": "C", "orig": "C", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 16, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 423.0, "r_y0": 202.2, "r_x1": 430.2, "r_y1": 202.2, "r_x2": 430.2, "r_y2": 192.9, "r_x3": 423.0, "r_y3": 192.9, "coord_origin": "TOPLEFT" }, "text": "C", "orig": "C", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 17, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 398.8, "r_y0": 214.6, "r_x1": 406.0, "r_y1": 214.6, "r_x2": 406.0, "r_y2": 205.3, "r_x3": 398.8, "r_y3": 205.3, "coord_origin": "TOPLEFT" }, "text": "C", "orig": "C", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 18, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 410.9, "r_y0": 214.6, "r_x1": 418.1, "r_y1": 214.6, "r_x2": 418.1, "r_y2": 205.3, "r_x3": 410.9, "r_y3": 205.3, "coord_origin": "TOPLEFT" }, "text": "C", "orig": "C", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 19, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 423.0, "r_y0": 214.6, "r_x1": 430.2, "r_y1": 214.6, "r_x2": 430.2, "r_y2": 205.2, "r_x3": 423.0, "r_y3": 205.2, "coord_origin": "TOPLEFT" }, "text": "C", "orig": "C", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 20, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 386.5, "r_y0": 226.4, "r_x1": 393.7, "r_y1": 226.4, "r_x2": 393.7, "r_y2": 217.0, "r_x3": 386.5, "r_y3": 217.0, "coord_origin": "TOPLEFT" }, "text": "C", "orig": "C", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 21, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 398.6, "r_y0": 226.5, "r_x1": 405.8, "r_y1": 226.5, "r_x2": 405.8, "r_y2": 217.2, "r_x3": 398.6, "r_y3": 217.2, "coord_origin": "TOPLEFT" }, "text": "C", "orig": "C", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 22, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 410.7, "r_y0": 226.5, "r_x1": 417.9, "r_y1": 226.5, "r_x2": 417.9, "r_y2": 217.2, "r_x3": 410.7, "r_y3": 217.2, "coord_origin": "TOPLEFT" }, "text": "C", "orig": "C", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 23, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 422.8, "r_y0": 226.5, "r_x1": 430.0, "r_y1": 226.5, "r_x2": 430.0, "r_y2": 217.1, "r_x3": 422.8, "r_y3": 217.1, "coord_origin": "TOPLEFT" }, "text": "C", "orig": "C", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 24, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 435.2, "r_y0": 177.0, "r_x1": 447.9, "r_y1": 177.0, "r_x2": 447.9, "r_y2": 167.7, "r_x3": 435.2, "r_y3": 167.7, "coord_origin": "TOPLEFT" }, "text": "NL", "orig": "NL", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 25, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 435.4, "r_y0": 189.5, "r_x1": 448.1, "r_y1": 189.5, "r_x2": 448.1, "r_y2": 180.2, "r_x3": 435.4, "r_y3": 180.2, "coord_origin": "TOPLEFT" }, "text": "NL", "orig": "NL", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 26, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 435.5, "r_y0": 201.8, "r_x1": 448.2, "r_y1": 201.8, "r_x2": 448.2, "r_y2": 192.5, "r_x3": 435.5, "r_y3": 192.5, "coord_origin": "TOPLEFT" }, "text": "NL", "orig": "NL", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 27, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 435.4, "r_y0": 214.2, "r_x1": 448.1, "r_y1": 214.2, "r_x2": 448.1, "r_y2": 204.8, "r_x3": 435.4, "r_y3": 204.8, "coord_origin": "TOPLEFT" }, "text": "NL", "orig": "NL", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 28, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 435.6, "r_y0": 226.6, "r_x1": 448.3, "r_y1": 226.6, "r_x2": 448.3, "r_y2": 217.2, "r_x3": 435.6, "r_y3": 217.2, "coord_origin": "TOPLEFT" }, "text": "NL", "orig": "NL", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 29, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 374.1, "r_y0": 214.6, "r_x1": 381.3, "r_y1": 214.6, "r_x2": 381.3, "r_y2": 205.2, "r_x3": 374.1, "r_y3": 205.2, "coord_origin": "TOPLEFT" }, "text": "U", "orig": "U", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 30, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 374.0, "r_y0": 226.5, "r_x1": 381.2, "r_y1": 226.5, "r_x2": 381.2, "r_y2": 217.1, "r_x3": 374.0, "r_y3": 217.1, "coord_origin": "TOPLEFT" }, "text": "U", "orig": "U", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 31, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 374.3, "r_y0": 190.3, "r_x1": 381.5, "r_y1": 190.3, "r_x2": 381.5, "r_y2": 180.9, "r_x3": 374.3, "r_y3": 180.9, "coord_origin": "TOPLEFT" }, "text": "U", "orig": "U", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 32, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 387.8, "r_y0": 177.9, "r_x1": 393.3, "r_y1": 177.9, "r_x2": 393.3, "r_y2": 168.6, "r_x3": 387.8, "r_y3": 168.6, "coord_origin": "TOPLEFT" }, "text": "L", "orig": "L", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 33, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 411.9, "r_y0": 177.4, "r_x1": 417.4, "r_y1": 177.4, "r_x2": 417.4, "r_y2": 168.1, "r_x3": 411.9, "r_y3": 168.1, "coord_origin": "TOPLEFT" }, "text": "L", "orig": "L", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 34, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 423.3, "r_y0": 177.3, "r_x1": 428.9, "r_y1": 177.3, "r_x2": 428.9, "r_y2": 167.9, "r_x3": 423.3, "r_y3": 167.9, "coord_origin": "TOPLEFT" }, "text": "L", "orig": "L", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 35, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 387.1, "r_y0": 190.1, "r_x1": 393.8, "r_y1": 190.1, "r_x2": 393.8, "r_y2": 180.8, "r_x3": 387.1, "r_y3": 180.8, "coord_origin": "TOPLEFT" }, "text": "X", "orig": "X", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 36, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 282.3, "r_y0": 253.8, "r_x1": 289.4, "r_y1": 253.8, "r_x2": 289.4, "r_y2": 244.5, "r_x3": 282.3, "r_y3": 244.5, "coord_origin": "TOPLEFT" }, "text": "C", "orig": "C", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 37, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 282.1, "r_y0": 266.2, "r_x1": 289.3, "r_y1": 266.2, "r_x2": 289.3, "r_y2": 256.9, "r_x3": 282.1, "r_y3": 256.9, "coord_origin": "TOPLEFT" }, "text": "U", "orig": "U", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 38, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 282.4, "r_y0": 278.5, "r_x1": 289.6, "r_y1": 278.5, "r_x2": 289.6, "r_y2": 269.1, "r_x3": 282.4, "r_y3": 269.1, "coord_origin": "TOPLEFT" }, "text": "U", "orig": "U", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 39, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 295.5, "r_y0": 253.8, "r_x1": 301.1, "r_y1": 253.8, "r_x2": 301.1, "r_y2": 244.5, "r_x3": 295.5, "r_y3": 244.5, "coord_origin": "TOPLEFT" }, "text": "L", "orig": "L", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 40, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 307.5, "r_y0": 253.9, "r_x1": 313.0, "r_y1": 253.9, "r_x2": 313.0, "r_y2": 244.6, "r_x3": 307.5, "r_y3": 244.6, "coord_origin": "TOPLEFT" }, "text": "L", "orig": "L", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 41, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 318.8, "r_y0": 253.8, "r_x1": 324.3, "r_y1": 253.8, "r_x2": 324.3, "r_y2": 244.4, "r_x3": 318.8, "r_y3": 244.4, "coord_origin": "TOPLEFT" }, "text": "L", "orig": "L", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 42, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 294.9, "r_y0": 266.0, "r_x1": 301.0, "r_y1": 266.0, "r_x2": 301.0, "r_y2": 256.7, "r_x3": 294.9, "r_y3": 256.7, "coord_origin": "TOPLEFT" }, "text": "X", "orig": "X", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 43, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 307.2, "r_y0": 266.0, "r_x1": 325.6, "r_y1": 266.0, "r_x2": 325.6, "r_y2": 256.7, "r_x3": 307.2, "r_y3": 256.7, "coord_origin": "TOPLEFT" }, "text": "X X", "orig": "X X", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 44, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 294.8, "r_y0": 278.6, "r_x1": 300.9, "r_y1": 278.6, "r_x2": 300.9, "r_y2": 269.3, "r_x3": 294.8, "r_y3": 269.3, "coord_origin": "TOPLEFT" }, "text": "X", "orig": "X", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 45, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 307.1, "r_y0": 278.6, "r_x1": 325.5, "r_y1": 278.6, "r_x2": 325.5, "r_y2": 269.3, "r_x3": 307.1, "r_y3": 269.3, "coord_origin": "TOPLEFT" }, "text": "X X", "orig": "X X", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 46, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 195.9, "r_y0": 278.1, "r_x1": 203.1, "r_y1": 278.1, "r_x2": 203.1, "r_y2": 268.7, "r_x3": 195.9, "r_y3": 268.7, "coord_origin": "TOPLEFT" }, "text": "C", "orig": "C", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 47, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 209.2, "r_y0": 278.1, "r_x1": 214.7, "r_y1": 278.1, "r_x2": 214.7, "r_y2": 268.7, "r_x3": 209.2, "r_y3": 268.7, "coord_origin": "TOPLEFT" }, "text": "L", "orig": "L", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 48, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 221.1, "r_y0": 278.1, "r_x1": 226.7, "r_y1": 278.1, "r_x2": 226.7, "r_y2": 268.8, "r_x3": 221.1, "r_y3": 268.8, "coord_origin": "TOPLEFT" }, "text": "L", "orig": "L", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 49, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 232.4, "r_y0": 278.0, "r_x1": 238.0, "r_y1": 278.0, "r_x2": 238.0, "r_y2": 268.7, "r_x3": 232.4, "r_y3": 268.7, "coord_origin": "TOPLEFT" }, "text": "L", "orig": "L", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 50, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 196.2, "r_y0": 253.9, "r_x1": 203.4, "r_y1": 253.9, "r_x2": 203.4, "r_y2": 244.5, "r_x3": 196.2, "r_y3": 244.5, "coord_origin": "TOPLEFT" }, "text": "C", "orig": "C", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 51, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 250.3, "r_y0": 253.4, "r_x1": 257.5, "r_y1": 253.4, "r_x2": 257.5, "r_y2": 244.1, "r_x3": 250.3, "r_y3": 244.1, "coord_origin": "TOPLEFT" }, "text": "C", "orig": "C", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 52, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 250.2, "r_y0": 265.8, "r_x1": 257.3, "r_y1": 265.8, "r_x2": 257.3, "r_y2": 256.4, "r_x3": 250.2, "r_y3": 256.4, "coord_origin": "TOPLEFT" }, "text": "U", "orig": "U", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 53, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 250.5, "r_y0": 278.0, "r_x1": 257.6, "r_y1": 278.0, "r_x2": 257.6, "r_y2": 268.7, "r_x3": 250.5, "r_y3": 268.7, "coord_origin": "TOPLEFT" }, "text": "U", "orig": "U", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 54, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 334.5, "r_y0": 249.2, "r_x1": 337.2, "r_y1": 249.2, "r_x2": 337.2, "r_y2": 243.0, "r_x3": 334.5, "r_y3": 243.0, "coord_origin": "TOPLEFT" }, "text": "1", "orig": "1", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 55, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 339.9, "r_y0": 249.2, "r_x1": 391.5, "r_y1": 249.2, "r_x2": 391.5, "r_y2": 243.0, "r_x3": 339.9, "r_y3": 243.0, "coord_origin": "TOPLEFT" }, "text": "- simple cells: \"C\"", "orig": "- simple cells: \"C\"", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 56, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 334.5, "r_y0": 259.1, "r_x1": 337.3, "r_y1": 259.1, "r_x2": 337.3, "r_y2": 252.9, "r_x3": 334.5, "r_y3": 252.9, "coord_origin": "TOPLEFT" }, "text": "2", "orig": "2", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 57, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 340.2, "r_y0": 259.1, "r_x1": 422.0, "r_y1": 259.1, "r_x2": 422.0, "r_y2": 252.9, "r_x3": 340.2, "r_y3": 252.9, "coord_origin": "TOPLEFT" }, "text": "- horizontal merges: \"C\", \"L\"", "orig": "- horizontal merges: \"C\", \"L\"", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 58, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 334.5, "r_y0": 269.1, "r_x1": 337.3, "r_y1": 269.1, "r_x2": 337.3, "r_y2": 262.9, "r_x3": 334.5, "r_y3": 262.9, "coord_origin": "TOPLEFT" }, "text": "3", "orig": "3", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 59, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 340.1, "r_y0": 269.1, "r_x1": 415.3, "r_y1": 269.1, "r_x2": 415.3, "r_y2": 262.9, "r_x3": 340.1, "r_y3": 262.9, "coord_origin": "TOPLEFT" }, "text": "- vertical merges: \"C\", \"U\"", "orig": "- vertical merges: \"C\", \"U\"", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 60, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 334.5, "r_y0": 279.0, "r_x1": 337.3, "r_y1": 279.0, "r_x2": 337.3, "r_y2": 272.8, "r_x3": 334.5, "r_y3": 272.8, "coord_origin": "TOPLEFT" }, "text": "4", "orig": "4", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 61, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 340.1, "r_y0": 279.0, "r_x1": 426.6, "r_y1": 279.0, "r_x2": 426.6, "r_y2": 272.8, "r_x3": 340.1, "r_y3": 272.8, "coord_origin": "TOPLEFT" }, "text": "- 2d merges: \"C\", \"L\", \"U\", \"X\"", "orig": "- 2d merges: \"C\", \"L\", \"U\", \"X\"", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 62, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 185.7, "r_y0": 250.3, "r_x1": 189.4, "r_y1": 250.3, "r_x2": 189.4, "r_y2": 244.0, "r_x3": 185.7, "r_y3": 244.0, "coord_origin": "TOPLEFT" }, "text": "1", "orig": "1", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 63, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 186.0, "r_y0": 274.6, "r_x1": 189.7, "r_y1": 274.6, "r_x2": 189.7, "r_y2": 268.3, "r_x3": 186.0, "r_y3": 268.3, "coord_origin": "TOPLEFT" }, "text": "2", "orig": "2", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 64, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 239.3, "r_y0": 249.8, "r_x1": 243.0, "r_y1": 249.8, "r_x2": 243.0, "r_y2": 243.6, "r_x3": 239.3, "r_y3": 243.6, "coord_origin": "TOPLEFT" }, "text": "3", "orig": "3", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 65, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 271.3, "r_y0": 249.7, "r_x1": 275.0, "r_y1": 249.7, "r_x2": 275.0, "r_y2": 243.5, "r_x3": 271.3, "r_y3": 243.5, "coord_origin": "TOPLEFT" }, "text": "4", "orig": "4", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 66, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 229.8, "r_y0": 172.7, "r_x1": 233.5, "r_y1": 172.7, "r_x2": 233.5, "r_y2": 166.5, "r_x3": 229.8, "r_y3": 166.5, "coord_origin": "TOPLEFT" }, "text": "2", "orig": "2", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 67, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 257.2, "r_y0": 196.2, "r_x1": 260.9, "r_y1": 196.2, "r_x2": 260.9, "r_y2": 190.0, "r_x3": 257.2, "r_y3": 190.0, "coord_origin": "TOPLEFT" }, "text": "1", "orig": "1", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 68, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 186.9, "r_y0": 184.2, "r_x1": 190.6, "r_y1": 184.2, "r_x2": 190.6, "r_y2": 178.0, "r_x3": 186.9, "r_y3": 178.0, "coord_origin": "TOPLEFT" }, "text": "3", "orig": "3", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 69, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 196.5, "r_y0": 175.2, "r_x1": 200.2, "r_y1": 175.2, "r_x2": 200.2, "r_y2": 169.0, "r_x3": 196.5, "r_y3": 169.0, "coord_origin": "TOPLEFT" }, "text": "4", "orig": "4", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 70, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 169.7, "r_y0": 175.7, "r_x1": 175.7, "r_y1": 175.7, "r_x2": 175.7, "r_y2": 167.9, "r_x3": 169.7, "r_y3": 167.9, "coord_origin": "TOPLEFT" }, "text": "A", "orig": "A", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 71, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 169.7, "r_y0": 214.6, "r_x1": 175.7, "r_y1": 214.6, "r_x2": 175.7, "r_y2": 206.8, "r_x3": 169.7, "r_y3": 206.8, "coord_origin": "TOPLEFT" }, "text": "B", "orig": "B", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 72, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 274.3, "r_y0": 176.0, "r_x1": 280.3, "r_y1": 176.0, "r_x2": 280.3, "r_y2": 168.3, "r_x3": 274.3, "r_y3": 168.3, "coord_origin": "TOPLEFT" }, "text": "C", "orig": "C", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 73, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 359.6, "r_y0": 176.0, "r_x1": 365.5, "r_y1": 176.0, "r_x2": 365.5, "r_y2": 168.3, "r_x3": 359.6, "r_y3": 168.3, "coord_origin": "TOPLEFT" }, "text": "D", "orig": "D", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 74, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 169.7, "r_y0": 251.0, "r_x1": 175.3, "r_y1": 251.0, "r_x2": 175.3, "r_y2": 243.2, "r_x3": 169.7, "r_y3": 243.2, "coord_origin": "TOPLEFT" }, "text": "E", "orig": "E", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [ { "id": 38, "label": "text", "bbox": { "l": 374.5, "t": 168.6, "r": 381.7, "b": 177.9, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 6, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 374.5, "r_y0": 177.9, "r_x1": 381.7, "r_y1": 177.9, "r_x2": 381.7, "r_y2": 168.6, "r_x3": 374.5, "r_y3": 168.6, "coord_origin": "TOPLEFT" }, "text": "C", "orig": "C", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 39, "label": "text", "bbox": { "l": 398.7, "t": 168.5, "r": 405.9, "b": 177.8, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 7, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 398.7, "r_y0": 177.8, "r_x1": 405.9, "r_y1": 177.8, "r_x2": 405.9, "r_y2": 168.5, "r_x3": 398.7, "r_y3": 168.5, "coord_origin": "TOPLEFT" }, "text": "C", "orig": "C", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 40, "label": "text", "bbox": { "l": 373.8, "t": 192.9, "r": 380.9, "b": 202.2, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 8, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 373.8, "r_y0": 202.2, "r_x1": 380.9, "r_y1": 202.2, "r_x2": 380.9, "r_y2": 192.9, "r_x3": 373.8, "r_y3": 192.9, "coord_origin": "TOPLEFT" }, "text": "C", "orig": "C", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 41, "label": "text", "bbox": { "l": 386.7, "t": 193.1, "r": 393.8, "b": 202.4, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 9, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 386.7, "r_y0": 202.4, "r_x1": 393.8, "r_y1": 202.4, "r_x2": 393.8, "r_y2": 193.1, "r_x3": 386.7, "r_y3": 193.1, "coord_origin": "TOPLEFT" }, "text": "C", "orig": "C", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 42, "label": "text", "bbox": { "l": 386.7, "t": 205.1, "r": 393.9, "b": 214.5, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 10, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 386.7, "r_y0": 214.5, "r_x1": 393.9, "r_y1": 214.5, "r_x2": 393.9, "r_y2": 205.1, "r_x3": 386.7, "r_y3": 205.1, "coord_origin": "TOPLEFT" }, "text": "C", "orig": "C", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 43, "label": "text", "bbox": { "l": 398.7, "t": 180.7, "r": 405.8, "b": 190.1, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 11, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 398.7, "r_y0": 190.1, "r_x1": 405.8, "r_y1": 190.1, "r_x2": 405.8, "r_y2": 180.7, "r_x3": 398.7, "r_y3": 180.7, "coord_origin": "TOPLEFT" }, "text": "C", "orig": "C", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 44, "label": "text", "bbox": { "l": 410.8, "t": 180.7, "r": 418.0, "b": 190.1, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 12, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 410.8, "r_y0": 190.1, "r_x1": 418.0, "r_y1": 190.1, "r_x2": 418.0, "r_y2": 180.7, "r_x3": 410.8, "r_y3": 180.7, "coord_origin": "TOPLEFT" }, "text": "C", "orig": "C", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 45, "label": "text", "bbox": { "l": 422.9, "t": 180.7, "r": 430.1, "b": 190.0, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 13, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 422.9, "r_y0": 190.0, "r_x1": 430.1, "r_y1": 190.0, "r_x2": 430.1, "r_y2": 180.7, "r_x3": 422.9, "r_y3": 180.7, "coord_origin": "TOPLEFT" }, "text": "C", "orig": "C", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 46, "label": "text", "bbox": { "l": 398.8, "t": 193.0, "r": 406.0, "b": 202.3, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 14, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 398.8, "r_y0": 202.3, "r_x1": 406.0, "r_y1": 202.3, "r_x2": 406.0, "r_y2": 193.0, "r_x3": 398.8, "r_y3": 193.0, "coord_origin": "TOPLEFT" }, "text": "C", "orig": "C", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 47, "label": "text", "bbox": { "l": 410.9, "t": 193.0, "r": 418.1, "b": 202.3, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 15, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 410.9, "r_y0": 202.3, "r_x1": 418.1, "r_y1": 202.3, "r_x2": 418.1, "r_y2": 193.0, "r_x3": 410.9, "r_y3": 193.0, "coord_origin": "TOPLEFT" }, "text": "C", "orig": "C", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 48, "label": "text", "bbox": { "l": 423.0, "t": 192.9, "r": 430.2, "b": 202.2, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 16, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 423.0, "r_y0": 202.2, "r_x1": 430.2, "r_y1": 202.2, "r_x2": 430.2, "r_y2": 192.9, "r_x3": 423.0, "r_y3": 192.9, "coord_origin": "TOPLEFT" }, "text": "C", "orig": "C", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 49, "label": "text", "bbox": { "l": 398.8, "t": 205.3, "r": 406.0, "b": 214.6, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 17, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 398.8, "r_y0": 214.6, "r_x1": 406.0, "r_y1": 214.6, "r_x2": 406.0, "r_y2": 205.3, "r_x3": 398.8, "r_y3": 205.3, "coord_origin": "TOPLEFT" }, "text": "C", "orig": "C", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 50, "label": "text", "bbox": { "l": 410.9, "t": 205.3, "r": 418.1, "b": 214.6, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 18, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 410.9, "r_y0": 214.6, "r_x1": 418.1, "r_y1": 214.6, "r_x2": 418.1, "r_y2": 205.3, "r_x3": 410.9, "r_y3": 205.3, "coord_origin": "TOPLEFT" }, "text": "C", "orig": "C", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 51, "label": "text", "bbox": { "l": 423.0, "t": 205.2, "r": 430.2, "b": 214.6, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 19, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 423.0, "r_y0": 214.6, "r_x1": 430.2, "r_y1": 214.6, "r_x2": 430.2, "r_y2": 205.2, "r_x3": 423.0, "r_y3": 205.2, "coord_origin": "TOPLEFT" }, "text": "C", "orig": "C", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 52, "label": "text", "bbox": { "l": 386.5, "t": 217.0, "r": 393.7, "b": 226.4, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 20, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 386.5, "r_y0": 226.4, "r_x1": 393.7, "r_y1": 226.4, "r_x2": 393.7, "r_y2": 217.0, "r_x3": 386.5, "r_y3": 217.0, "coord_origin": "TOPLEFT" }, "text": "C", "orig": "C", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 53, "label": "text", "bbox": { "l": 398.6, "t": 217.2, "r": 405.8, "b": 226.5, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 21, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 398.6, "r_y0": 226.5, "r_x1": 405.8, "r_y1": 226.5, "r_x2": 405.8, "r_y2": 217.2, "r_x3": 398.6, "r_y3": 217.2, "coord_origin": "TOPLEFT" }, "text": "C", "orig": "C", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 54, "label": "text", "bbox": { "l": 410.7, "t": 217.2, "r": 417.9, "b": 226.5, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 22, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 410.7, "r_y0": 226.5, "r_x1": 417.9, "r_y1": 226.5, "r_x2": 417.9, "r_y2": 217.2, "r_x3": 410.7, "r_y3": 217.2, "coord_origin": "TOPLEFT" }, "text": "C", "orig": "C", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 55, "label": "text", "bbox": { "l": 422.8, "t": 217.1, "r": 430.0, "b": 226.5, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 23, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 422.8, "r_y0": 226.5, "r_x1": 430.0, "r_y1": 226.5, "r_x2": 430.0, "r_y2": 217.1, "r_x3": 422.8, "r_y3": 217.1, "coord_origin": "TOPLEFT" }, "text": "C", "orig": "C", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 56, "label": "text", "bbox": { "l": 435.2, "t": 167.7, "r": 447.9, "b": 177.0, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 24, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 435.2, "r_y0": 177.0, "r_x1": 447.9, "r_y1": 177.0, "r_x2": 447.9, "r_y2": 167.7, "r_x3": 435.2, "r_y3": 167.7, "coord_origin": "TOPLEFT" }, "text": "NL", "orig": "NL", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 57, "label": "text", "bbox": { "l": 435.4, "t": 180.2, "r": 448.1, "b": 189.5, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 25, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 435.4, "r_y0": 189.5, "r_x1": 448.1, "r_y1": 189.5, "r_x2": 448.1, "r_y2": 180.2, "r_x3": 435.4, "r_y3": 180.2, "coord_origin": "TOPLEFT" }, "text": "NL", "orig": "NL", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 58, "label": "text", "bbox": { "l": 435.5, "t": 192.5, "r": 448.2, "b": 201.8, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 26, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 435.5, "r_y0": 201.8, "r_x1": 448.2, "r_y1": 201.8, "r_x2": 448.2, "r_y2": 192.5, "r_x3": 435.5, "r_y3": 192.5, "coord_origin": "TOPLEFT" }, "text": "NL", "orig": "NL", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 59, "label": "text", "bbox": { "l": 435.4, "t": 204.8, "r": 448.1, "b": 214.2, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 27, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 435.4, "r_y0": 214.2, "r_x1": 448.1, "r_y1": 214.2, "r_x2": 448.1, "r_y2": 204.8, "r_x3": 435.4, "r_y3": 204.8, "coord_origin": "TOPLEFT" }, "text": "NL", "orig": "NL", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 60, "label": "text", "bbox": { "l": 435.6, "t": 217.2, "r": 448.3, "b": 226.6, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 28, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 435.6, "r_y0": 226.6, "r_x1": 448.3, "r_y1": 226.6, "r_x2": 448.3, "r_y2": 217.2, "r_x3": 435.6, "r_y3": 217.2, "coord_origin": "TOPLEFT" }, "text": "NL", "orig": "NL", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 61, "label": "text", "bbox": { "l": 374.1, "t": 205.2, "r": 381.3, "b": 214.6, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 29, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 374.1, "r_y0": 214.6, "r_x1": 381.3, "r_y1": 214.6, "r_x2": 381.3, "r_y2": 205.2, "r_x3": 374.1, "r_y3": 205.2, "coord_origin": "TOPLEFT" }, "text": "U", "orig": "U", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 62, "label": "text", "bbox": { "l": 374.0, "t": 217.1, "r": 381.2, "b": 226.5, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 30, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 374.0, "r_y0": 226.5, "r_x1": 381.2, "r_y1": 226.5, "r_x2": 381.2, "r_y2": 217.1, "r_x3": 374.0, "r_y3": 217.1, "coord_origin": "TOPLEFT" }, "text": "U", "orig": "U", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 63, "label": "text", "bbox": { "l": 374.3, "t": 180.9, "r": 381.5, "b": 190.3, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 31, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 374.3, "r_y0": 190.3, "r_x1": 381.5, "r_y1": 190.3, "r_x2": 381.5, "r_y2": 180.9, "r_x3": 374.3, "r_y3": 180.9, "coord_origin": "TOPLEFT" }, "text": "U", "orig": "U", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 64, "label": "text", "bbox": { "l": 387.8, "t": 168.6, "r": 393.3, "b": 177.9, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 32, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 387.8, "r_y0": 177.9, "r_x1": 393.3, "r_y1": 177.9, "r_x2": 393.3, "r_y2": 168.6, "r_x3": 387.8, "r_y3": 168.6, "coord_origin": "TOPLEFT" }, "text": "L", "orig": "L", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 65, "label": "text", "bbox": { "l": 411.9, "t": 168.1, "r": 417.4, "b": 177.4, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 33, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 411.9, "r_y0": 177.4, "r_x1": 417.4, "r_y1": 177.4, "r_x2": 417.4, "r_y2": 168.1, "r_x3": 411.9, "r_y3": 168.1, "coord_origin": "TOPLEFT" }, "text": "L", "orig": "L", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 66, "label": "text", "bbox": { "l": 423.3, "t": 167.9, "r": 428.9, "b": 177.3, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 34, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 423.3, "r_y0": 177.3, "r_x1": 428.9, "r_y1": 177.3, "r_x2": 428.9, "r_y2": 167.9, "r_x3": 423.3, "r_y3": 167.9, "coord_origin": "TOPLEFT" }, "text": "L", "orig": "L", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 67, "label": "text", "bbox": { "l": 387.1, "t": 180.8, "r": 393.8, "b": 190.1, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 35, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 387.1, "r_y0": 190.1, "r_x1": 393.8, "r_y1": 190.1, "r_x2": 393.8, "r_y2": 180.8, "r_x3": 387.1, "r_y3": 180.8, "coord_origin": "TOPLEFT" }, "text": "X", "orig": "X", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 68, "label": "text", "bbox": { "l": 282.3, "t": 244.5, "r": 289.4, "b": 253.8, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 36, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 282.3, "r_y0": 253.8, "r_x1": 289.4, "r_y1": 253.8, "r_x2": 289.4, "r_y2": 244.5, "r_x3": 282.3, "r_y3": 244.5, "coord_origin": "TOPLEFT" }, "text": "C", "orig": "C", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 69, "label": "text", "bbox": { "l": 282.1, "t": 256.9, "r": 289.3, "b": 266.2, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 37, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 282.1, "r_y0": 266.2, "r_x1": 289.3, "r_y1": 266.2, "r_x2": 289.3, "r_y2": 256.9, "r_x3": 282.1, "r_y3": 256.9, "coord_origin": "TOPLEFT" }, "text": "U", "orig": "U", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 70, "label": "text", "bbox": { "l": 282.4, "t": 269.1, "r": 289.6, "b": 278.5, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 38, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 282.4, "r_y0": 278.5, "r_x1": 289.6, "r_y1": 278.5, "r_x2": 289.6, "r_y2": 269.1, "r_x3": 282.4, "r_y3": 269.1, "coord_origin": "TOPLEFT" }, "text": "U", "orig": "U", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 71, "label": "text", "bbox": { "l": 295.5, "t": 244.5, "r": 301.1, "b": 253.8, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 39, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 295.5, "r_y0": 253.8, "r_x1": 301.1, "r_y1": 253.8, "r_x2": 301.1, "r_y2": 244.5, "r_x3": 295.5, "r_y3": 244.5, "coord_origin": "TOPLEFT" }, "text": "L", "orig": "L", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 72, "label": "text", "bbox": { "l": 307.5, "t": 244.6, "r": 313.0, "b": 253.9, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 40, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 307.5, "r_y0": 253.9, "r_x1": 313.0, "r_y1": 253.9, "r_x2": 313.0, "r_y2": 244.6, "r_x3": 307.5, "r_y3": 244.6, "coord_origin": "TOPLEFT" }, "text": "L", "orig": "L", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 73, "label": "text", "bbox": { "l": 318.8, "t": 244.4, "r": 324.3, "b": 253.8, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 41, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 318.8, "r_y0": 253.8, "r_x1": 324.3, "r_y1": 253.8, "r_x2": 324.3, "r_y2": 244.4, "r_x3": 318.8, "r_y3": 244.4, "coord_origin": "TOPLEFT" }, "text": "L", "orig": "L", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 74, "label": "text", "bbox": { "l": 294.9, "t": 256.7, "r": 301.0, "b": 266.0, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 42, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 294.9, "r_y0": 266.0, "r_x1": 301.0, "r_y1": 266.0, "r_x2": 301.0, "r_y2": 256.7, "r_x3": 294.9, "r_y3": 256.7, "coord_origin": "TOPLEFT" }, "text": "X", "orig": "X", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 75, "label": "text", "bbox": { "l": 307.2, "t": 256.7, "r": 325.6, "b": 266.0, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 43, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 307.2, "r_y0": 266.0, "r_x1": 325.6, "r_y1": 266.0, "r_x2": 325.6, "r_y2": 256.7, "r_x3": 307.2, "r_y3": 256.7, "coord_origin": "TOPLEFT" }, "text": "X X", "orig": "X X", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 76, "label": "text", "bbox": { "l": 294.8, "t": 269.3, "r": 300.9, "b": 278.6, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 44, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 294.8, "r_y0": 278.6, "r_x1": 300.9, "r_y1": 278.6, "r_x2": 300.9, "r_y2": 269.3, "r_x3": 294.8, "r_y3": 269.3, "coord_origin": "TOPLEFT" }, "text": "X", "orig": "X", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 77, "label": "text", "bbox": { "l": 307.1, "t": 269.3, "r": 325.5, "b": 278.6, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 45, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 307.1, "r_y0": 278.6, "r_x1": 325.5, "r_y1": 278.6, "r_x2": 325.5, "r_y2": 269.3, "r_x3": 307.1, "r_y3": 269.3, "coord_origin": "TOPLEFT" }, "text": "X X", "orig": "X X", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 78, "label": "text", "bbox": { "l": 195.9, "t": 268.7, "r": 203.1, "b": 278.1, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 46, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 195.9, "r_y0": 278.1, "r_x1": 203.1, "r_y1": 278.1, "r_x2": 203.1, "r_y2": 268.7, "r_x3": 195.9, "r_y3": 268.7, "coord_origin": "TOPLEFT" }, "text": "C", "orig": "C", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 79, "label": "text", "bbox": { "l": 209.2, "t": 268.7, "r": 214.7, "b": 278.1, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 47, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 209.2, "r_y0": 278.1, "r_x1": 214.7, "r_y1": 278.1, "r_x2": 214.7, "r_y2": 268.7, "r_x3": 209.2, "r_y3": 268.7, "coord_origin": "TOPLEFT" }, "text": "L", "orig": "L", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 80, "label": "text", "bbox": { "l": 221.1, "t": 268.8, "r": 226.7, "b": 278.1, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 48, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 221.1, "r_y0": 278.1, "r_x1": 226.7, "r_y1": 278.1, "r_x2": 226.7, "r_y2": 268.8, "r_x3": 221.1, "r_y3": 268.8, "coord_origin": "TOPLEFT" }, "text": "L", "orig": "L", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 81, "label": "text", "bbox": { "l": 232.4, "t": 268.7, "r": 238.0, "b": 278.0, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 49, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 232.4, "r_y0": 278.0, "r_x1": 238.0, "r_y1": 278.0, "r_x2": 238.0, "r_y2": 268.7, "r_x3": 232.4, "r_y3": 268.7, "coord_origin": "TOPLEFT" }, "text": "L", "orig": "L", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 82, "label": "text", "bbox": { "l": 196.2, "t": 244.5, "r": 203.4, "b": 253.9, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 50, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 196.2, "r_y0": 253.9, "r_x1": 203.4, "r_y1": 253.9, "r_x2": 203.4, "r_y2": 244.5, "r_x3": 196.2, "r_y3": 244.5, "coord_origin": "TOPLEFT" }, "text": "C", "orig": "C", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 83, "label": "text", "bbox": { "l": 250.3, "t": 244.1, "r": 257.5, "b": 253.4, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 51, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 250.3, "r_y0": 253.4, "r_x1": 257.5, "r_y1": 253.4, "r_x2": 257.5, "r_y2": 244.1, "r_x3": 250.3, "r_y3": 244.1, "coord_origin": "TOPLEFT" }, "text": "C", "orig": "C", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 84, "label": "text", "bbox": { "l": 250.2, "t": 256.4, "r": 257.3, "b": 265.8, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 52, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 250.2, "r_y0": 265.8, "r_x1": 257.3, "r_y1": 265.8, "r_x2": 257.3, "r_y2": 256.4, "r_x3": 250.2, "r_y3": 256.4, "coord_origin": "TOPLEFT" }, "text": "U", "orig": "U", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 85, "label": "text", "bbox": { "l": 250.5, "t": 268.7, "r": 257.6, "b": 278.0, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 53, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 250.5, "r_y0": 278.0, "r_x1": 257.6, "r_y1": 278.0, "r_x2": 257.6, "r_y2": 268.7, "r_x3": 250.5, "r_y3": 268.7, "coord_origin": "TOPLEFT" }, "text": "U", "orig": "U", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 86, "label": "text", "bbox": { "l": 334.5, "t": 243.0, "r": 337.2, "b": 249.2, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 54, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 334.5, "r_y0": 249.2, "r_x1": 337.2, "r_y1": 249.2, "r_x2": 337.2, "r_y2": 243.0, "r_x3": 334.5, "r_y3": 243.0, "coord_origin": "TOPLEFT" }, "text": "1", "orig": "1", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 87, "label": "text", "bbox": { "l": 339.9, "t": 243.0, "r": 391.5, "b": 249.2, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 55, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 339.9, "r_y0": 249.2, "r_x1": 391.5, "r_y1": 249.2, "r_x2": 391.5, "r_y2": 243.0, "r_x3": 339.9, "r_y3": 243.0, "coord_origin": "TOPLEFT" }, "text": "- simple cells: \"C\"", "orig": "- simple cells: \"C\"", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 88, "label": "text", "bbox": { "l": 334.5, "t": 252.9, "r": 337.3, "b": 259.1, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 56, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 334.5, "r_y0": 259.1, "r_x1": 337.3, "r_y1": 259.1, "r_x2": 337.3, "r_y2": 252.9, "r_x3": 334.5, "r_y3": 252.9, "coord_origin": "TOPLEFT" }, "text": "2", "orig": "2", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 89, "label": "text", "bbox": { "l": 340.2, "t": 252.9, "r": 422.0, "b": 259.1, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 57, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 340.2, "r_y0": 259.1, "r_x1": 422.0, "r_y1": 259.1, "r_x2": 422.0, "r_y2": 252.9, "r_x3": 340.2, "r_y3": 252.9, "coord_origin": "TOPLEFT" }, "text": "- horizontal merges: \"C\", \"L\"", "orig": "- horizontal merges: \"C\", \"L\"", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 90, "label": "text", "bbox": { "l": 334.5, "t": 262.9, "r": 337.3, "b": 269.1, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 58, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 334.5, "r_y0": 269.1, "r_x1": 337.3, "r_y1": 269.1, "r_x2": 337.3, "r_y2": 262.9, "r_x3": 334.5, "r_y3": 262.9, "coord_origin": "TOPLEFT" }, "text": "3", "orig": "3", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 91, "label": "text", "bbox": { "l": 340.1, "t": 262.9, "r": 415.3, "b": 269.1, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 59, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 340.1, "r_y0": 269.1, "r_x1": 415.3, "r_y1": 269.1, "r_x2": 415.3, "r_y2": 262.9, "r_x3": 340.1, "r_y3": 262.9, "coord_origin": "TOPLEFT" }, "text": "- vertical merges: \"C\", \"U\"", "orig": "- vertical merges: \"C\", \"U\"", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 18, "label": "list_item", "bbox": { "l": 334.5, "t": 272.8, "r": 426.6, "b": 279.0, "coord_origin": "TOPLEFT" }, "confidence": 0.53, "cells": [ { "index": 60, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 334.5, "r_y0": 279.0, "r_x1": 337.3, "r_y1": 279.0, "r_x2": 337.3, "r_y2": 272.8, "r_x3": 334.5, "r_y3": 272.8, "coord_origin": "TOPLEFT" }, "text": "4", "orig": "4", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 61, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 340.1, "r_y0": 279.0, "r_x1": 426.6, "r_y1": 279.0, "r_x2": 426.6, "r_y2": 272.8, "r_x3": 340.1, "r_y3": 272.8, "coord_origin": "TOPLEFT" }, "text": "- 2d merges: \"C\", \"L\", \"U\", \"X\"", "orig": "- 2d merges: \"C\", \"L\", \"U\", \"X\"", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 92, "label": "text", "bbox": { "l": 185.7, "t": 244.0, "r": 189.4, "b": 250.3, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 62, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 185.7, "r_y0": 250.3, "r_x1": 189.4, "r_y1": 250.3, "r_x2": 189.4, "r_y2": 244.0, "r_x3": 185.7, "r_y3": 244.0, "coord_origin": "TOPLEFT" }, "text": "1", "orig": "1", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 93, "label": "text", "bbox": { "l": 186.0, "t": 268.3, "r": 189.7, "b": 274.6, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 63, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 186.0, "r_y0": 274.6, "r_x1": 189.7, "r_y1": 274.6, "r_x2": 189.7, "r_y2": 268.3, "r_x3": 186.0, "r_y3": 268.3, "coord_origin": "TOPLEFT" }, "text": "2", "orig": "2", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 94, "label": "text", "bbox": { "l": 239.3, "t": 243.6, "r": 243.0, "b": 249.8, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 64, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 239.3, "r_y0": 249.8, "r_x1": 243.0, "r_y1": 249.8, "r_x2": 243.0, "r_y2": 243.6, "r_x3": 239.3, "r_y3": 243.6, "coord_origin": "TOPLEFT" }, "text": "3", "orig": "3", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 95, "label": "text", "bbox": { "l": 271.3, "t": 243.5, "r": 275.0, "b": 249.7, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 65, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 271.3, "r_y0": 249.7, "r_x1": 275.0, "r_y1": 249.7, "r_x2": 275.0, "r_y2": 243.5, "r_x3": 271.3, "r_y3": 243.5, "coord_origin": "TOPLEFT" }, "text": "4", "orig": "4", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 96, "label": "text", "bbox": { "l": 229.8, "t": 166.5, "r": 233.5, "b": 172.7, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 66, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 229.8, "r_y0": 172.7, "r_x1": 233.5, "r_y1": 172.7, "r_x2": 233.5, "r_y2": 166.5, "r_x3": 229.8, "r_y3": 166.5, "coord_origin": "TOPLEFT" }, "text": "2", "orig": "2", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 97, "label": "text", "bbox": { "l": 257.2, "t": 190.0, "r": 260.9, "b": 196.2, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 67, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 257.2, "r_y0": 196.2, "r_x1": 260.9, "r_y1": 196.2, "r_x2": 260.9, "r_y2": 190.0, "r_x3": 257.2, "r_y3": 190.0, "coord_origin": "TOPLEFT" }, "text": "1", "orig": "1", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 98, "label": "text", "bbox": { "l": 186.9, "t": 178.0, "r": 190.6, "b": 184.2, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 68, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 186.9, "r_y0": 184.2, "r_x1": 190.6, "r_y1": 184.2, "r_x2": 190.6, "r_y2": 178.0, "r_x3": 186.9, "r_y3": 178.0, "coord_origin": "TOPLEFT" }, "text": "3", "orig": "3", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 99, "label": "text", "bbox": { "l": 196.5, "t": 169.0, "r": 200.2, "b": 175.2, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 69, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 196.5, "r_y0": 175.2, "r_x1": 200.2, "r_y1": 175.2, "r_x2": 200.2, "r_y2": 169.0, "r_x3": 196.5, "r_y3": 169.0, "coord_origin": "TOPLEFT" }, "text": "4", "orig": "4", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 100, "label": "text", "bbox": { "l": 169.7, "t": 167.9, "r": 175.7, "b": 175.7, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 70, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 169.7, "r_y0": 175.7, "r_x1": 175.7, "r_y1": 175.7, "r_x2": 175.7, "r_y2": 167.9, "r_x3": 169.7, "r_y3": 167.9, "coord_origin": "TOPLEFT" }, "text": "A", "orig": "A", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 101, "label": "text", "bbox": { "l": 169.7, "t": 206.8, "r": 175.7, "b": 214.6, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 71, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 169.7, "r_y0": 214.6, "r_x1": 175.7, "r_y1": 214.6, "r_x2": 175.7, "r_y2": 206.8, "r_x3": 169.7, "r_y3": 206.8, "coord_origin": "TOPLEFT" }, "text": "B", "orig": "B", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 102, "label": "text", "bbox": { "l": 274.3, "t": 168.3, "r": 280.3, "b": 176.0, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 72, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 274.3, "r_y0": 176.0, "r_x1": 280.3, "r_y1": 176.0, "r_x2": 280.3, "r_y2": 168.3, "r_x3": 274.3, "r_y3": 168.3, "coord_origin": "TOPLEFT" }, "text": "C", "orig": "C", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 103, "label": "text", "bbox": { "l": 359.6, "t": 168.3, "r": 365.5, "b": 176.0, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 73, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 359.6, "r_y0": 176.0, "r_x1": 365.5, "r_y1": 176.0, "r_x2": 365.5, "r_y2": 168.3, "r_x3": 359.6, "r_y3": 168.3, "coord_origin": "TOPLEFT" }, "text": "D", "orig": "D", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 104, "label": "text", "bbox": { "l": 169.7, "t": 243.2, "r": 175.3, "b": 251.0, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 74, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 169.7, "r_y0": 251.0, "r_x1": 175.3, "r_y1": 251.0, "r_x2": 175.3, "r_y2": 243.2, "r_x3": 169.7, "r_y3": 243.2, "coord_origin": "TOPLEFT" }, "text": "E", "orig": "E", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] } ] }, "text": "", "annotations": [], "provenance": null, "predicted_class": null, "confidence": null }, { "label": "section_header", "id": 9, "page_no": 6, "cluster": { "id": 9, "label": "section_header", "bbox": { "l": 134.8, "t": 305.3, "r": 246.7, "b": 314.1, "coord_origin": "TOPLEFT" }, "confidence": 0.92, "cells": [ { "index": 75, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 134.8, "r_y0": 314.1, "r_x1": 149.4, "r_y1": 314.1, "r_x2": 149.4, "r_y2": 305.3, "r_x3": 134.8, "r_y3": 305.3, "coord_origin": "TOPLEFT" }, "text": "4.2", "orig": "4.2", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 76, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 160.9, "r_y0": 314.1, "r_x1": 246.7, "r_y1": 314.1, "r_x2": 246.7, "r_y2": 305.3, "r_x3": 160.9, "r_y3": 305.3, "coord_origin": "TOPLEFT" }, "text": "Language Syntax", "orig": "Language Syntax", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, "text": "4.2 Language Syntax" }, { "label": "text", "id": 10, "page_no": 6, "cluster": { "id": 10, "label": "text", "bbox": { "l": 134.8, "t": 325.2, "r": 363.8, "b": 334.0, "coord_origin": "TOPLEFT" }, "confidence": 0.92, "cells": [ { "index": 77, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 134.8, "r_y0": 334.0, "r_x1": 363.8, "r_y1": 334.0, "r_x2": 363.8, "r_y2": 325.2, "r_x3": 134.8, "r_y3": 325.2, "coord_origin": "TOPLEFT" }, "text": "The OTSL representation follows these syntax rules:", "orig": "The OTSL representation follows these syntax rules:", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, "text": "The OTSL representation follows these syntax rules:" }, { "label": "list_item", "id": 3, "page_no": 6, "cluster": { "id": 3, "label": "list_item", "bbox": { "l": 139.0, "t": 347.2, "r": 480.6, "b": 367.9, "coord_origin": "TOPLEFT" }, "confidence": 0.96, "cells": [ { "index": 78, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 139.0, "r_y0": 356.0, "r_x1": 146.7, "r_y1": 356.0, "r_x2": 146.7, "r_y2": 347.2, "r_x3": 139.0, "r_y3": 347.2, "coord_origin": "TOPLEFT" }, "text": "1.", "orig": "1.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 79, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 151.7, "r_y0": 356.0, "r_x1": 257.4, "r_y1": 356.0, "r_x2": 257.4, "r_y2": 347.2, "r_x3": 151.7, "r_y3": 347.2, "coord_origin": "TOPLEFT" }, "text": "Left-looking cell rule", "orig": "Left-looking cell rule", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 80, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 257.4, "r_y0": 356.0, "r_x1": 480.6, "r_y1": 356.0, "r_x2": 480.6, "r_y2": 347.2, "r_x3": 257.4, "r_y3": 347.2, "coord_origin": "TOPLEFT" }, "text": ": The left neighbour of an \"L\" cell must be either", "orig": ": The left neighbour of an \"L\" cell must be either", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 81, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 151.7, "r_y0": 367.9, "r_x1": 283.6, "r_y1": 367.9, "r_x2": 283.6, "r_y2": 359.1, "r_x3": 151.7, "r_y3": 359.1, "coord_origin": "TOPLEFT" }, "text": "another \"L\" cell or a \"C\" cell.", "orig": "another \"L\" cell or a \"C\" cell.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, "text": "1. Left-looking cell rule : The left neighbour of an \"L\" cell must be either another \"L\" cell or a \"C\" cell." }, { "label": "list_item", "id": 4, "page_no": 6, "cluster": { "id": 4, "label": "list_item", "bbox": { "l": 139.0, "t": 371.1, "r": 480.6, "b": 391.8, "coord_origin": "TOPLEFT" }, "confidence": 0.96, "cells": [ { "index": 82, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 139.0, "r_y0": 379.9, "r_x1": 146.7, "r_y1": 379.9, "r_x2": 146.7, "r_y2": 371.1, "r_x3": 139.0, "r_y3": 371.1, "coord_origin": "TOPLEFT" }, "text": "2.", "orig": "2.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 83, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 151.7, "r_y0": 379.9, "r_x1": 252.1, "r_y1": 379.9, "r_x2": 252.1, "r_y2": 371.1, "r_x3": 151.7, "r_y3": 371.1, "coord_origin": "TOPLEFT" }, "text": "Up-looking cell rule", "orig": "Up-looking cell rule", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 84, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 252.1, "r_y0": 379.9, "r_x1": 480.6, "r_y1": 379.9, "r_x2": 480.6, "r_y2": 371.1, "r_x3": 252.1, "r_y3": 371.1, "coord_origin": "TOPLEFT" }, "text": ": The upper neighbour of a \"U\" cell must be either", "orig": ": The upper neighbour of a \"U\" cell must be either", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 85, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 151.7, "r_y0": 391.8, "r_x1": 284.8, "r_y1": 391.8, "r_x2": 284.8, "r_y2": 383.0, "r_x3": 151.7, "r_y3": 383.0, "coord_origin": "TOPLEFT" }, "text": "another \"U\" cell or a \"C\" cell.", "orig": "another \"U\" cell or a \"C\" cell.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, "text": "2. Up-looking cell rule : The upper neighbour of a \"U\" cell must be either another \"U\" cell or a \"C\" cell." }, { "label": "section_header", "id": 14, "page_no": 6, "cluster": { "id": 14, "label": "section_header", "bbox": { "l": 139.0, "t": 395.0, "r": 226.1, "b": 403.8, "coord_origin": "TOPLEFT" }, "confidence": 0.65, "cells": [ { "index": 86, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 139.0, "r_y0": 403.8, "r_x1": 146.7, "r_y1": 403.8, "r_x2": 146.7, "r_y2": 395.0, "r_x3": 139.0, "r_y3": 395.0, "coord_origin": "TOPLEFT" }, "text": "3.", "orig": "3.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 87, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 151.7, "r_y0": 403.8, "r_x1": 223.3, "r_y1": 403.8, "r_x2": 223.3, "r_y2": 395.0, "r_x3": 151.7, "r_y3": 395.0, "coord_origin": "TOPLEFT" }, "text": "Cross cell rule", "orig": "Cross cell rule", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 88, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 223.3, "r_y0": 403.8, "r_x1": 226.1, "r_y1": 403.8, "r_x2": 226.1, "r_y2": 395.0, "r_x3": 223.3, "r_y3": 395.0, "coord_origin": "TOPLEFT" }, "text": ":", "orig": ":", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, "text": "3. Cross cell rule :" }, { "label": "list_item", "id": 13, "page_no": 6, "cluster": { "id": 13, "label": "list_item", "bbox": { "l": 151.7, "t": 407.0, "r": 480.6, "b": 439.7, "coord_origin": "TOPLEFT" }, "confidence": 0.72, "cells": [ { "index": 89, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 151.7, "r_y0": 415.8, "r_x1": 480.6, "r_y1": 415.8, "r_x2": 480.6, "r_y2": 407.0, "r_x3": 151.7, "r_y3": 407.0, "coord_origin": "TOPLEFT" }, "text": "The left neighbour of an \"X\" cell must be either another \"X\" cell or a \"U\"", "orig": "The left neighbour of an \"X\" cell must be either another \"X\" cell or a \"U\"", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 90, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 151.7, "r_y0": 427.7, "r_x1": 480.6, "r_y1": 427.7, "r_x2": 480.6, "r_y2": 418.9, "r_x3": 151.7, "r_y3": 418.9, "coord_origin": "TOPLEFT" }, "text": "cell, and the upper neighbour of an \"X\" cell must be either another \"X\" cell", "orig": "cell, and the upper neighbour of an \"X\" cell must be either another \"X\" cell", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 91, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 151.7, "r_y0": 439.7, "r_x1": 214.4, "r_y1": 439.7, "r_x2": 214.4, "r_y2": 430.9, "r_x3": 151.7, "r_y3": 430.9, "coord_origin": "TOPLEFT" }, "text": "or an \"L\" cell.", "orig": "or an \"L\" cell.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, "text": "The left neighbour of an \"X\" cell must be either another \"X\" cell or a \"U\" cell, and the upper neighbour of an \"X\" cell must be either another \"X\" cell or an \"L\" cell." }, { "label": "list_item", "id": 8, "page_no": 6, "cluster": { "id": 8, "label": "list_item", "bbox": { "l": 139.0, "t": 442.8, "r": 474.6, "b": 451.6, "coord_origin": "TOPLEFT" }, "confidence": 0.93, "cells": [ { "index": 92, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 139.0, "r_y0": 451.6, "r_x1": 146.7, "r_y1": 451.6, "r_x2": 146.7, "r_y2": 442.8, "r_x3": 139.0, "r_y3": 442.8, "coord_origin": "TOPLEFT" }, "text": "4.", "orig": "4.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 93, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 151.7, "r_y0": 451.6, "r_x1": 221.3, "r_y1": 451.6, "r_x2": 221.3, "r_y2": 442.8, "r_x3": 151.7, "r_y3": 442.8, "coord_origin": "TOPLEFT" }, "text": "First row rule", "orig": "First row rule", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 94, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 221.3, "r_y0": 451.6, "r_x1": 474.6, "r_y1": 451.6, "r_x2": 474.6, "r_y2": 442.8, "r_x3": 221.3, "r_y3": 442.8, "coord_origin": "TOPLEFT" }, "text": ": Only \"L\" cells and \"C\" cells are allowed in the first row.", "orig": ": Only \"L\" cells and \"C\" cells are allowed in the first row.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, "text": "4. First row rule : Only \"L\" cells and \"C\" cells are allowed in the first row." }, { "label": "list_item", "id": 5, "page_no": 6, "cluster": { "id": 5, "label": "list_item", "bbox": { "l": 139.0, "t": 454.8, "r": 480.6, "b": 475.5, "coord_origin": "TOPLEFT" }, "confidence": 0.94, "cells": [ { "index": 95, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 139.0, "r_y0": 463.6, "r_x1": 146.7, "r_y1": 463.6, "r_x2": 146.7, "r_y2": 454.8, "r_x3": 139.0, "r_y3": 454.8, "coord_origin": "TOPLEFT" }, "text": "5.", "orig": "5.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 96, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 151.7, "r_y0": 463.6, "r_x1": 240.7, "r_y1": 463.6, "r_x2": 240.7, "r_y2": 454.8, "r_x3": 151.7, "r_y3": 454.8, "coord_origin": "TOPLEFT" }, "text": "First column rule", "orig": "First column rule", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 97, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 240.7, "r_y0": 463.6, "r_x1": 480.6, "r_y1": 463.6, "r_x2": 480.6, "r_y2": 454.8, "r_x3": 240.7, "r_y3": 454.8, "coord_origin": "TOPLEFT" }, "text": ": Only \"U\" cells and \"C\" cells are allowed in the first", "orig": ": Only \"U\" cells and \"C\" cells are allowed in the first", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 98, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 151.7, "r_y0": 475.5, "r_x1": 186.0, "r_y1": 475.5, "r_x2": 186.0, "r_y2": 466.7, "r_x3": 151.7, "r_y3": 466.7, "coord_origin": "TOPLEFT" }, "text": "column.", "orig": "column.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, "text": "5. First column rule : Only \"U\" cells and \"C\" cells are allowed in the first column." }, { "label": "list_item", "id": 1, "page_no": 6, "cluster": { "id": 1, "label": "list_item", "bbox": { "l": 139.0, "t": 478.7, "r": 480.6, "b": 499.5, "coord_origin": "TOPLEFT" }, "confidence": 0.96, "cells": [ { "index": 99, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 139.0, "r_y0": 487.5, "r_x1": 146.7, "r_y1": 487.5, "r_x2": 146.7, "r_y2": 478.7, "r_x3": 139.0, "r_y3": 478.7, "coord_origin": "TOPLEFT" }, "text": "6.", "orig": "6.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 100, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 151.7, "r_y0": 487.5, "r_x1": 235.2, "r_y1": 487.5, "r_x2": 235.2, "r_y2": 478.7, "r_x3": 151.7, "r_y3": 478.7, "coord_origin": "TOPLEFT" }, "text": "Rectangular rule", "orig": "Rectangular rule", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 101, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 235.2, "r_y0": 487.5, "r_x1": 480.6, "r_y1": 487.5, "r_x2": 480.6, "r_y2": 478.7, "r_x3": 235.2, "r_y3": 478.7, "coord_origin": "TOPLEFT" }, "text": ": The table representation is always rectangular - all rows", "orig": ": The table representation is always rectangular - all rows", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 102, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 151.7, "r_y0": 499.5, "r_x1": 448.0, "r_y1": 499.5, "r_x2": 448.0, "r_y2": 490.7, "r_x3": 151.7, "r_y3": 490.7, "coord_origin": "TOPLEFT" }, "text": "must have an equal number of tokens, terminated with \"NL\" token.", "orig": "must have an equal number of tokens, terminated with \"NL\" token.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, "text": "6. Rectangular rule : The table representation is always rectangular - all rows must have an equal number of tokens, terminated with \"NL\" token." }, { "label": "text", "id": 0, "page_no": 6, "cluster": { "id": 0, "label": "text", "bbox": { "l": 134.8, "t": 512.6, "r": 480.6, "b": 640.9, "coord_origin": "TOPLEFT" }, "confidence": 0.98, "cells": [ { "index": 103, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 149.7, "r_y0": 521.4, "r_x1": 480.6, "r_y1": 521.4, "r_x2": 480.6, "r_y2": 512.6, "r_x3": 149.7, "r_y3": 512.6, "coord_origin": "TOPLEFT" }, "text": "The application of these rules gives OTSL a set of unique properties. First", "orig": "The application of these rules gives OTSL a set of unique properties. First", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 104, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 134.8, "r_y0": 533.3, "r_x1": 480.6, "r_y1": 533.3, "r_x2": 480.6, "r_y2": 524.5, "r_x3": 134.8, "r_y3": 524.5, "coord_origin": "TOPLEFT" }, "text": "of all, the OTSL enforces a strictly rectangular structure representation, where", "orig": "of all, the OTSL enforces a strictly rectangular structure representation, where", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 105, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 134.8, "r_y0": 545.3, "r_x1": 480.6, "r_y1": 545.3, "r_x2": 480.6, "r_y2": 536.5, "r_x3": 134.8, "r_y3": 536.5, "coord_origin": "TOPLEFT" }, "text": "every new-line token starts a new row. As a consequence, all rows and all columns", "orig": "every new-line token starts a new row. As a consequence, all rows and all columns", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 106, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 134.8, "r_y0": 557.3, "r_x1": 480.6, "r_y1": 557.3, "r_x2": 480.6, "r_y2": 548.5, "r_x3": 134.8, "r_y3": 548.5, "coord_origin": "TOPLEFT" }, "text": "have exactly the same number of tokens, irrespective of cell spans. Secondly, the", "orig": "have exactly the same number of tokens, irrespective of cell spans. Secondly, the", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 107, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 134.8, "r_y0": 569.2, "r_x1": 480.6, "r_y1": 569.2, "r_x2": 480.6, "r_y2": 560.4, "r_x3": 134.8, "r_y3": 560.4, "coord_origin": "TOPLEFT" }, "text": "OTSL representation is unambiguous: Every table structure is represented in one", "orig": "OTSL representation is unambiguous: Every table structure is represented in one", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 108, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 134.8, "r_y0": 581.2, "r_x1": 480.6, "r_y1": 581.2, "r_x2": 480.6, "r_y2": 572.4, "r_x3": 134.8, "r_y3": 572.4, "coord_origin": "TOPLEFT" }, "text": "way. In this representation every table cell corresponds to a \"C\"-cell token, which", "orig": "way. In this representation every table cell corresponds to a \"C\"-cell token, which", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 109, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 134.8, "r_y0": 593.1, "r_x1": 480.6, "r_y1": 593.1, "r_x2": 480.6, "r_y2": 584.3, "r_x3": 134.8, "r_y3": 584.3, "coord_origin": "TOPLEFT" }, "text": "in case of spans is always located in the top-left corner of the table cell definition.", "orig": "in case of spans is always located in the top-left corner of the table cell definition.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 110, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 134.8, "r_y0": 605.1, "r_x1": 480.6, "r_y1": 605.1, "r_x2": 480.6, "r_y2": 596.3, "r_x3": 134.8, "r_y3": 596.3, "coord_origin": "TOPLEFT" }, "text": "Third, OTSL syntax rules are only backward-looking. As a consequence, every", "orig": "Third, OTSL syntax rules are only backward-looking. As a consequence, every", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 111, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 134.8, "r_y0": 617.0, "r_x1": 480.6, "r_y1": 617.0, "r_x2": 480.6, "r_y2": 608.2, "r_x3": 134.8, "r_y3": 608.2, "coord_origin": "TOPLEFT" }, "text": "predicted token can be validated straight during sequence generation by looking", "orig": "predicted token can be validated straight during sequence generation by looking", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 112, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 134.8, "r_y0": 629.0, "r_x1": 480.6, "r_y1": 629.0, "r_x2": 480.6, "r_y2": 620.2, "r_x3": 134.8, "r_y3": 620.2, "coord_origin": "TOPLEFT" }, "text": "at the previously predicted sequence. As such, OTSL can guarantee that every", "orig": "at the previously predicted sequence. As such, OTSL can guarantee that every", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 113, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 134.8, "r_y0": 640.9, "r_x1": 311.2, "r_y1": 640.9, "r_x2": 311.2, "r_y2": 632.1, "r_x3": 134.8, "r_y3": 632.1, "coord_origin": "TOPLEFT" }, "text": "predicted sequence is syntactically valid.", "orig": "predicted sequence is syntactically valid.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, "text": "The application of these rules gives OTSL a set of unique properties. First of all, the OTSL enforces a strictly rectangular structure representation, where every new-line token starts a new row. As a consequence, all rows and all columns have exactly the same number of tokens, irrespective of cell spans. Secondly, the OTSL representation is unambiguous: Every table structure is represented in one way. In this representation every table cell corresponds to a \"C\"-cell token, which in case of spans is always located in the top-left corner of the table cell definition. Third, OTSL syntax rules are only backward-looking. As a consequence, every predicted token can be validated straight during sequence generation by looking at the previously predicted sequence. As such, OTSL can guarantee that every predicted sequence is syntactically valid." }, { "label": "text", "id": 2, "page_no": 6, "cluster": { "id": 2, "label": "text", "bbox": { "l": 134.8, "t": 644.1, "r": 480.6, "b": 664.9, "coord_origin": "TOPLEFT" }, "confidence": 0.96, "cells": [ { "index": 114, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 149.7, "r_y0": 652.9, "r_x1": 480.6, "r_y1": 652.9, "r_x2": 480.6, "r_y2": 644.1, "r_x3": 149.7, "r_y3": 644.1, "coord_origin": "TOPLEFT" }, "text": "These characteristics can be easily learned by sequence generator networks,", "orig": "These characteristics can be easily learned by sequence generator networks,", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 115, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 134.8, "r_y0": 664.9, "r_x1": 480.6, "r_y1": 664.9, "r_x2": 480.6, "r_y2": 656.1, "r_x3": 134.8, "r_y3": 656.1, "coord_origin": "TOPLEFT" }, "text": "as we demonstrate further below. We find strong indications that this pattern", "orig": "as we demonstrate further below. We find strong indications that this pattern", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, "text": "These characteristics can be easily learned by sequence generator networks, as we demonstrate further below. We find strong indications that this pattern" } ], "headers": [ { "label": "page_header", "id": 7, "page_no": 6, "cluster": { "id": 7, "label": "page_header", "bbox": { "l": 194.5, "t": 93.8, "r": 447.5, "b": 101.8, "coord_origin": "TOPLEFT" }, "confidence": 0.93, "cells": [ { "index": 0, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 194.5, "r_y0": 101.8, "r_x1": 447.5, "r_y1": 101.8, "r_x2": 447.5, "r_y2": 93.8, "r_x3": 194.5, "r_y3": 93.8, "coord_origin": "TOPLEFT" }, "text": "Optimized Table Tokenization for Table Structure Recognition", "orig": "Optimized Table Tokenization for Table Structure Recognition", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, "text": "Optimized Table Tokenization for Table Structure Recognition" }, { "label": "page_header", "id": 11, "page_no": 6, "cluster": { "id": 11, "label": "page_header", "bbox": { "l": 476.0, "t": 93.8, "r": 480.6, "b": 101.8, "coord_origin": "TOPLEFT" }, "confidence": 0.87, "cells": [ { "index": 1, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 476.0, "r_y0": 101.8, "r_x1": 480.6, "r_y1": 101.8, "r_x2": 480.6, "r_y2": 93.8, "r_x3": 476.0, "r_y3": 93.8, "coord_origin": "TOPLEFT" }, "text": "7", "orig": "7", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, "text": "7" } ] } }, { "page_no": 7, "size": { "width": 612.0, "height": 792.0 }, "parsed_page": { "dimension": { "angle": 0.0, "rect": { "r_x0": 0.0, "r_y0": 0.0, "r_x1": 612.0, "r_y1": 0.0, "r_x2": 612.0, "r_y2": 792.0, "r_x3": 0.0, "r_y3": 792.0, "coord_origin": "BOTTOMLEFT" }, "boundary_type": "crop_box", "art_bbox": { "l": 0.0, "t": 792.0, "r": 612.0, "b": 0.0, "coord_origin": "BOTTOMLEFT" }, "bleed_bbox": { "l": 0.0, "t": 792.0, "r": 612.0, "b": 0.0, "coord_origin": "BOTTOMLEFT" }, "crop_bbox": { "l": 0.0, "t": 792.0, "r": 612.0, "b": 0.0, "coord_origin": "BOTTOMLEFT" }, "media_bbox": { "l": 0.0, "t": 792.0, "r": 612.0, "b": 0.0, "coord_origin": "BOTTOMLEFT" }, "trim_bbox": { "l": 0.0, "t": 792.0, "r": 612.0, "b": 0.0, "coord_origin": "BOTTOMLEFT" } }, "bitmap_resources": [], "char_cells": [], "word_cells": [], "textline_cells": [ { "index": 0, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 134.8, "r_y0": 101.8, "r_x1": 139.4, "r_y1": 101.8, "r_x2": 139.4, "r_y2": 93.8, "r_x3": 134.8, "r_y3": 93.8, "coord_origin": "TOPLEFT" }, "text": "8", "orig": "8", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 1, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 167.8, "r_y0": 101.8, "r_x1": 178.1, "r_y1": 101.8, "r_x2": 178.1, "r_y2": 93.8, "r_x3": 167.8, "r_y3": 93.8, "coord_origin": "TOPLEFT" }, "text": "M.", "orig": "M.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 2, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 182.4, "r_y0": 101.8, "r_x1": 231.7, "r_y1": 101.8, "r_x2": 231.7, "r_y2": 93.8, "r_x3": 182.4, "r_y3": 93.8, "coord_origin": "TOPLEFT" }, "text": "Lysak, et al.", "orig": "Lysak, et al.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 3, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 134.8, "r_y0": 127.7, "r_x1": 480.6, "r_y1": 127.7, "r_x2": 480.6, "r_y2": 118.9, "r_x3": 134.8, "r_y3": 118.9, "coord_origin": "TOPLEFT" }, "text": "reduces significantly the column drift seen in the HTML based models (see Fig-", "orig": "reduces significantly the column drift seen in the HTML based models (see Fig-", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 4, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 134.8, "r_y0": 139.7, "r_x1": 163.6, "r_y1": 139.7, "r_x2": 163.6, "r_y2": 130.9, "r_x3": 134.8, "r_y3": 130.9, "coord_origin": "TOPLEFT" }, "text": "ure 5).", "orig": "ure 5).", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 5, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 134.8, "r_y0": 170.4, "r_x1": 149.4, "r_y1": 170.4, "r_x2": 149.4, "r_y2": 161.6, "r_x3": 134.8, "r_y3": 161.6, "coord_origin": "TOPLEFT" }, "text": "4.3", "orig": "4.3", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 6, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 160.9, "r_y0": 170.4, "r_x1": 319.3, "r_y1": 170.4, "r_x2": 319.3, "r_y2": 161.6, "r_x3": 160.9, "r_y3": 161.6, "coord_origin": "TOPLEFT" }, "text": "Error-detection and -mitigation", "orig": "Error-detection and -mitigation", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 7, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 134.8, "r_y0": 191.1, "r_x1": 480.6, "r_y1": 191.1, "r_x2": 480.6, "r_y2": 182.3, "r_x3": 134.8, "r_y3": 182.3, "coord_origin": "TOPLEFT" }, "text": "The design of OTSL allows to validate a table structure easily on an unfinished", "orig": "The design of OTSL allows to validate a table structure easily on an unfinished", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 8, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 134.8, "r_y0": 203.0, "r_x1": 480.6, "r_y1": 203.0, "r_x2": 480.6, "r_y2": 194.2, "r_x3": 134.8, "r_y3": 194.2, "coord_origin": "TOPLEFT" }, "text": "sequence. The detection of an invalid sequence token is a clear indication of a", "orig": "sequence. The detection of an invalid sequence token is a clear indication of a", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 9, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 134.8, "r_y0": 215.0, "r_x1": 480.6, "r_y1": 215.0, "r_x2": 480.6, "r_y2": 206.2, "r_x3": 134.8, "r_y3": 206.2, "coord_origin": "TOPLEFT" }, "text": "prediction mistake, however a valid sequence by itself does not guarantee pre-", "orig": "prediction mistake, however a valid sequence by itself does not guarantee pre-", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 10, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 134.8, "r_y0": 226.9, "r_x1": 480.6, "r_y1": 226.9, "r_x2": 480.6, "r_y2": 218.1, "r_x3": 134.8, "r_y3": 218.1, "coord_origin": "TOPLEFT" }, "text": "diction correctness. Different heuristics can be used to correct token errors in", "orig": "diction correctness. Different heuristics can be used to correct token errors in", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 11, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 134.8, "r_y0": 238.9, "r_x1": 480.6, "r_y1": 238.9, "r_x2": 480.6, "r_y2": 230.1, "r_x3": 134.8, "r_y3": 230.1, "coord_origin": "TOPLEFT" }, "text": "an invalid sequence and thus increase the chances for accurate predictions. Such", "orig": "an invalid sequence and thus increase the chances for accurate predictions. Such", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 12, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 134.8, "r_y0": 250.9, "r_x1": 480.6, "r_y1": 250.9, "r_x2": 480.6, "r_y2": 242.1, "r_x3": 134.8, "r_y3": 242.1, "coord_origin": "TOPLEFT" }, "text": "heuristics can be applied either after the prediction of each token, or at the end", "orig": "heuristics can be applied either after the prediction of each token, or at the end", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 13, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 134.8, "r_y0": 262.8, "r_x1": 480.6, "r_y1": 262.8, "r_x2": 480.6, "r_y2": 254.0, "r_x3": 134.8, "r_y3": 254.0, "coord_origin": "TOPLEFT" }, "text": "on the entire predicted sequence. For example a simple heuristic which can cor-", "orig": "on the entire predicted sequence. For example a simple heuristic which can cor-", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 14, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 134.8, "r_y0": 274.8, "r_x1": 480.6, "r_y1": 274.8, "r_x2": 480.6, "r_y2": 266.0, "r_x3": 134.8, "r_y3": 266.0, "coord_origin": "TOPLEFT" }, "text": "rect the predicted OTSL sequence on-the-fly is to verify if the token with the", "orig": "rect the predicted OTSL sequence on-the-fly is to verify if the token with the", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 15, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 134.8, "r_y0": 286.7, "r_x1": 480.6, "r_y1": 286.7, "r_x2": 480.6, "r_y2": 277.9, "r_x3": 134.8, "r_y3": 277.9, "coord_origin": "TOPLEFT" }, "text": "highest prediction confidence invalidates the predicted sequence, and replace it", "orig": "highest prediction confidence invalidates the predicted sequence, and replace it", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 16, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 134.8, "r_y0": 298.7, "r_x1": 469.4, "r_y1": 298.7, "r_x2": 469.4, "r_y2": 289.9, "r_x3": 134.8, "r_y3": 289.9, "coord_origin": "TOPLEFT" }, "text": "by the token with the next highest confidence until OTSL rules are satisfied.", "orig": "by the token with the next highest confidence until OTSL rules are satisfied.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 17, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 134.8, "r_y0": 331.7, "r_x1": 141.5, "r_y1": 331.7, "r_x2": 141.5, "r_y2": 321.2, "r_x3": 134.8, "r_y3": 321.2, "coord_origin": "TOPLEFT" }, "text": "5", "orig": "5", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 18, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 154.9, "r_y0": 331.7, "r_x1": 229.0, "r_y1": 331.7, "r_x2": 229.0, "r_y2": 321.2, "r_x3": 154.9, "r_y3": 321.2, "coord_origin": "TOPLEFT" }, "text": "Experiments", "orig": "Experiments", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 19, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 134.8, "r_y0": 356.0, "r_x1": 480.6, "r_y1": 356.0, "r_x2": 480.6, "r_y2": 347.2, "r_x3": 134.8, "r_y3": 347.2, "coord_origin": "TOPLEFT" }, "text": "To evaluate the impact of OTSL on prediction accuracy and inference times, we", "orig": "To evaluate the impact of OTSL on prediction accuracy and inference times, we", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 20, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 134.8, "r_y0": 368.0, "r_x1": 480.6, "r_y1": 368.0, "r_x2": 480.6, "r_y2": 359.2, "r_x3": 134.8, "r_y3": 359.2, "coord_origin": "TOPLEFT" }, "text": "conducted a series of experiments based on the TableFormer model (Figure 4)", "orig": "conducted a series of experiments based on the TableFormer model (Figure 4)", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 21, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 134.8, "r_y0": 380.0, "r_x1": 480.6, "r_y1": 380.0, "r_x2": 480.6, "r_y2": 371.2, "r_x3": 134.8, "r_y3": 371.2, "coord_origin": "TOPLEFT" }, "text": "with two objectives: Firstly we evaluate the prediction quality and performance", "orig": "with two objectives: Firstly we evaluate the prediction quality and performance", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 22, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 134.8, "r_y0": 391.9, "r_x1": 480.6, "r_y1": 391.9, "r_x2": 480.6, "r_y2": 383.1, "r_x3": 134.8, "r_y3": 383.1, "coord_origin": "TOPLEFT" }, "text": "of OTSL vs. HTML after performing Hyper Parameter Optimization (HPO) on", "orig": "of OTSL vs. HTML after performing Hyper Parameter Optimization (HPO) on", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 23, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 134.8, "r_y0": 403.9, "r_x1": 148.6, "r_y1": 403.9, "r_x2": 148.6, "r_y2": 395.1, "r_x3": 134.8, "r_y3": 395.1, "coord_origin": "TOPLEFT" }, "text": "the", "orig": "the", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 24, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 151.6, "r_y0": 403.9, "r_x1": 191.8, "r_y1": 403.9, "r_x2": 191.8, "r_y2": 395.1, "r_x3": 151.6, "r_y3": 395.1, "coord_origin": "TOPLEFT" }, "text": "canonical", "orig": "canonical", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 25, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 195.9, "r_y0": 403.9, "r_x1": 480.6, "r_y1": 403.9, "r_x2": 480.6, "r_y2": 395.1, "r_x3": 195.9, "r_y3": 395.1, "coord_origin": "TOPLEFT" }, "text": "PubTabNet data set. Secondly we pick the best hyper-parameters", "orig": "PubTabNet data set. Secondly we pick the best hyper-parameters", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 26, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 134.8, "r_y0": 415.8, "r_x1": 480.6, "r_y1": 415.8, "r_x2": 480.6, "r_y2": 407.0, "r_x3": 134.8, "r_y3": 407.0, "coord_origin": "TOPLEFT" }, "text": "found in the first step and evaluate how OTSL impacts the performance of", "orig": "found in the first step and evaluate how OTSL impacts the performance of", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 27, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 134.8, "r_y0": 427.8, "r_x1": 480.6, "r_y1": 427.8, "r_x2": 480.6, "r_y2": 419.0, "r_x3": 134.8, "r_y3": 419.0, "coord_origin": "TOPLEFT" }, "text": "TableFormer after training on other publicly available data sets (FinTabNet,", "orig": "TableFormer after training on other publicly available data sets (FinTabNet,", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 28, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 134.8, "r_y0": 439.7, "r_x1": 480.6, "r_y1": 439.7, "r_x2": 480.6, "r_y2": 430.9, "r_x3": 134.8, "r_y3": 430.9, "coord_origin": "TOPLEFT" }, "text": "PubTables-1M [14]). The ground truth (GT) from all data sets has been con-", "orig": "PubTables-1M [14]). The ground truth (GT) from all data sets has been con-", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 29, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 134.8, "r_y0": 451.7, "r_x1": 479.3, "r_y1": 451.7, "r_x2": 479.3, "r_y2": 442.9, "r_x3": 134.8, "r_y3": 442.9, "coord_origin": "TOPLEFT" }, "text": "verted into OTSL format for this purpose, and will be made publicly available.", "orig": "verted into OTSL format for this purpose, and will be made publicly available.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 30, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 134.8, "r_y0": 492.6, "r_x1": 162.6, "r_y1": 492.6, "r_x2": 162.6, "r_y2": 484.6, "r_x3": 134.8, "r_y3": 484.6, "coord_origin": "TOPLEFT" }, "text": "Fig. 4.", "orig": "Fig. 4.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 31, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 165.2, "r_y0": 492.8, "r_x1": 480.6, "r_y1": 492.8, "r_x2": 480.6, "r_y2": 484.7, "r_x3": 165.2, "r_y3": 484.7, "coord_origin": "TOPLEFT" }, "text": "Architecture sketch of the TableFormer model, which is a representative for the", "orig": "Architecture sketch of the TableFormer model, which is a representative for the", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 32, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 134.8, "r_y0": 503.7, "r_x1": 206.7, "r_y1": 503.7, "r_x2": 206.7, "r_y2": 495.7, "r_x3": 134.8, "r_y3": 495.7, "coord_origin": "TOPLEFT" }, "text": "Im2Seq approach.", "orig": "Im2Seq approach.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 33, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 147.3, "r_y0": 543.1, "r_x1": 149.7, "r_y1": 543.1, "r_x2": 149.7, "r_y2": 540.7, "r_x3": 147.3, "r_y3": 540.7, "coord_origin": "TOPLEFT" }, "text": "1.", "orig": "1.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 34, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 150.9, "r_y0": 543.1, "r_x1": 155.7, "r_y1": 543.1, "r_x2": 155.7, "r_y2": 540.7, "r_x3": 150.9, "r_y3": 540.7, "coord_origin": "TOPLEFT" }, "text": "Item", "orig": "Item", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 35, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 162.8, "r_y0": 537.8, "r_x1": 172.3, "r_y1": 537.8, "r_x2": 172.3, "r_y2": 535.4, "r_x3": 162.8, "r_y3": 535.4, "coord_origin": "TOPLEFT" }, "text": "Amount", "orig": "Amount", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 36, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 147.6, "r_y0": 537.7, "r_x1": 155.9, "r_y1": 537.7, "r_x2": 155.9, "r_y2": 535.4, "r_x3": 147.6, "r_y3": 535.4, "coord_origin": "TOPLEFT" }, "text": "Names", "orig": "Names", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 37, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 158.5, "r_y0": 543.1, "r_x1": 164.1, "r_y1": 543.1, "r_x2": 164.1, "r_y2": 540.7, "r_x3": 158.5, "r_y3": 540.7, "coord_origin": "TOPLEFT" }, "text": "1000", "orig": "1000", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 38, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 158.5, "r_y0": 547.0, "r_x1": 162.7, "r_y1": 547.0, "r_x2": 162.7, "r_y2": 544.7, "r_x3": 158.5, "r_y3": 544.7, "coord_origin": "TOPLEFT" }, "text": "500", "orig": "500", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 39, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 158.5, "r_y0": 551.3, "r_x1": 164.1, "r_y1": 551.3, "r_x2": 164.1, "r_y2": 548.9, "r_x3": 158.5, "r_y3": 548.9, "coord_origin": "TOPLEFT" }, "text": "3500", "orig": "3500", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 40, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 158.5, "r_y0": 555.5, "r_x1": 162.7, "r_y1": 555.5, "r_x2": 162.7, "r_y2": 553.2, "r_x3": 158.5, "r_y3": 553.2, "coord_origin": "TOPLEFT" }, "text": "150", "orig": "150", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 41, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 168.8, "r_y0": 543.1, "r_x1": 172.9, "r_y1": 543.1, "r_x2": 172.9, "r_y2": 540.7, "r_x3": 168.8, "r_y3": 540.7, "coord_origin": "TOPLEFT" }, "text": "unit", "orig": "unit", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 42, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 168.8, "r_y0": 547.0, "r_x1": 172.9, "r_y1": 547.0, "r_x2": 172.9, "r_y2": 544.7, "r_x3": 168.8, "r_y3": 544.7, "coord_origin": "TOPLEFT" }, "text": "unit", "orig": "unit", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 43, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 168.8, "r_y0": 551.3, "r_x1": 172.9, "r_y1": 551.3, "r_x2": 172.9, "r_y2": 548.9, "r_x3": 168.8, "r_y3": 548.9, "coord_origin": "TOPLEFT" }, "text": "unit", "orig": "unit", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 44, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 168.8, "r_y0": 555.5, "r_x1": 172.9, "r_y1": 555.5, "r_x2": 172.9, "r_y2": 553.2, "r_x3": 168.8, "r_y3": 553.2, "coord_origin": "TOPLEFT" }, "text": "unit", "orig": "unit", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 45, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 147.3, "r_y0": 547.0, "r_x1": 149.7, "r_y1": 547.0, "r_x2": 149.7, "r_y2": 544.7, "r_x3": 147.3, "r_y3": 544.7, "coord_origin": "TOPLEFT" }, "text": "2.", "orig": "2.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 46, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 150.9, "r_y0": 547.0, "r_x1": 155.7, "r_y1": 547.0, "r_x2": 155.7, "r_y2": 544.7, "r_x3": 150.9, "r_y3": 544.7, "coord_origin": "TOPLEFT" }, "text": "Item", "orig": "Item", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 47, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 147.3, "r_y0": 551.3, "r_x1": 149.7, "r_y1": 551.3, "r_x2": 149.7, "r_y2": 548.9, "r_x3": 147.3, "r_y3": 548.9, "coord_origin": "TOPLEFT" }, "text": "3.", "orig": "3.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 48, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 150.9, "r_y0": 551.3, "r_x1": 155.7, "r_y1": 551.3, "r_x2": 155.7, "r_y2": 548.9, "r_x3": 150.9, "r_y3": 548.9, "coord_origin": "TOPLEFT" }, "text": "Item", "orig": "Item", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 49, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 147.3, "r_y0": 555.5, "r_x1": 149.7, "r_y1": 555.5, "r_x2": 149.7, "r_y2": 553.2, "r_x3": 147.3, "r_y3": 553.2, "coord_origin": "TOPLEFT" }, "text": "4.", "orig": "4.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 50, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 150.9, "r_y0": 555.5, "r_x1": 155.7, "r_y1": 555.5, "r_x2": 155.7, "r_y2": 553.2, "r_x3": 150.9, "r_y3": 553.2, "coord_origin": "TOPLEFT" }, "text": "Item", "orig": "Item", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 51, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 152.1, "r_y0": 521.3, "r_x1": 171.2, "r_y1": 521.3, "r_x2": 171.2, "r_y2": 517.0, "r_x3": 152.1, "r_y3": 517.0, "coord_origin": "TOPLEFT" }, "text": "Extracted", "orig": "Extracted", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 52, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 148.1, "r_y0": 526.6, "r_x1": 175.2, "r_y1": 526.6, "r_x2": 175.2, "r_y2": 522.3, "r_x3": 148.1, "r_y3": 522.3, "coord_origin": "TOPLEFT" }, "text": "Table Images", "orig": "Table Images", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 53, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 193.5, "r_y0": 528.8, "r_x1": 220.3, "r_y1": 528.8, "r_x2": 220.3, "r_y2": 524.5, "r_x3": 193.5, "r_y3": 524.5, "coord_origin": "TOPLEFT" }, "text": "Standardized", "orig": "Standardized", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 54, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 199.5, "r_y0": 534.1, "r_x1": 214.4, "r_y1": 534.1, "r_x2": 214.4, "r_y2": 529.8, "r_x3": 199.5, "r_y3": 529.8, "coord_origin": "TOPLEFT" }, "text": "Images", "orig": "Images", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 55, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 273.6, "r_y0": 514.2, "r_x1": 284.5, "r_y1": 514.2, "r_x2": 284.5, "r_y2": 509.9, "r_x3": 273.6, "r_y3": 509.9, "coord_origin": "TOPLEFT" }, "text": "BBox", "orig": "BBox", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 56, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 270.5, "r_y0": 518.0, "r_x1": 287.6, "r_y1": 518.0, "r_x2": 287.6, "r_y2": 513.7, "r_x3": 270.5, "r_y3": 513.7, "coord_origin": "TOPLEFT" }, "text": "Decoder", "orig": "Decoder", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 57, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 332.5, "r_y0": 512.4, "r_x1": 348.1, "r_y1": 512.4, "r_x2": 348.1, "r_y2": 508.1, "r_x3": 332.5, "r_y3": 508.1, "coord_origin": "TOPLEFT" }, "text": "BBoxes", "orig": "BBoxes", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 58, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 376.7, "r_y0": 525.4, "r_x1": 407.3, "r_y1": 525.4, "r_x2": 407.3, "r_y2": 521.1, "r_x3": 376.7, "r_y3": 521.1, "coord_origin": "TOPLEFT" }, "text": "BBoxes can be", "orig": "BBoxes can be", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 59, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 373.9, "r_y0": 529.9, "r_x1": 410.0, "r_y1": 529.9, "r_x2": 410.0, "r_y2": 525.7, "r_x3": 373.9, "r_y3": 525.7, "coord_origin": "TOPLEFT" }, "text": "traced back to the", "orig": "traced back to the", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 60, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 375.3, "r_y0": 534.5, "r_x1": 408.6, "r_y1": 534.5, "r_x2": 408.6, "r_y2": 530.2, "r_x3": 375.3, "r_y3": 530.2, "coord_origin": "TOPLEFT" }, "text": "original image to", "orig": "original image to", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 61, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 377.1, "r_y0": 539.0, "r_x1": 406.9, "r_y1": 539.0, "r_x2": 406.9, "r_y2": 534.8, "r_x3": 377.1, "r_y3": 534.8, "coord_origin": "TOPLEFT" }, "text": "extract content", "orig": "extract content", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 62, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 383.6, "r_y0": 567.5, "r_x1": 433.8, "r_y1": 567.5, "r_x2": 433.8, "r_y2": 563.2, "r_x3": 383.6, "r_y3": 563.2, "coord_origin": "TOPLEFT" }, "text": "Structure Tags sequence", "orig": "Structure Tags sequence", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 63, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 383.5, "r_y0": 572.0, "r_x1": 433.8, "r_y1": 572.0, "r_x2": 433.8, "r_y2": 567.8, "r_x3": 383.5, "r_y3": 567.8, "coord_origin": "TOPLEFT" }, "text": "provide full description of", "orig": "provide full description of", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 64, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 390.5, "r_y0": 576.6, "r_x1": 426.9, "r_y1": 576.6, "r_x2": 426.9, "r_y2": 572.3, "r_x3": 390.5, "r_y3": 572.3, "coord_origin": "TOPLEFT" }, "text": "the table structure", "orig": "the table structure", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 65, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 293.9, "r_y0": 582.2, "r_x1": 323.2, "r_y1": 582.2, "r_x2": 323.2, "r_y2": 577.9, "r_x3": 293.9, "r_y3": 577.9, "coord_origin": "TOPLEFT" }, "text": "Structure Tags", "orig": "Structure Tags", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 66, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 293.9, "r_y0": 586.7, "r_x1": 324.6, "r_y1": 586.7, "r_x2": 324.6, "r_y2": 582.4, "r_x3": 293.9, "r_y3": 582.4, "coord_origin": "TOPLEFT" }, "text": "in OTSL format", "orig": "in OTSL format", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 67, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 333.1, "r_y0": 546.1, "r_x1": 364.1, "r_y1": 546.1, "r_x2": 364.1, "r_y2": 541.8, "r_x3": 333.1, "r_y3": 541.8, "coord_origin": "TOPLEFT" }, "text": "BBoxes in sync", "orig": "BBoxes in sync", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 68, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 333.1, "r_y0": 549.9, "r_x1": 369.7, "r_y1": 549.9, "r_x2": 369.7, "r_y2": 545.6, "r_x3": 333.1, "r_y3": 545.6, "coord_origin": "TOPLEFT" }, "text": "with tag sequence", "orig": "with tag sequence", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 69, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 232.7, "r_y0": 519.5, "r_x1": 249.6, "r_y1": 519.5, "r_x2": 249.6, "r_y2": 515.2, "r_x3": 232.7, "r_y3": 515.2, "coord_origin": "TOPLEFT" }, "text": "Encoder", "orig": "Encoder", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 70, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 269.8, "r_y0": 550.2, "r_x1": 288.3, "r_y1": 550.2, "r_x2": 288.3, "r_y2": 546.0, "r_x3": 269.8, "r_y3": 546.0, "coord_origin": "TOPLEFT" }, "text": "Structure", "orig": "Structure", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 71, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 270.5, "r_y0": 554.0, "r_x1": 287.6, "r_y1": 554.0, "r_x2": 287.6, "r_y2": 549.8, "r_x3": 270.5, "r_y3": 549.8, "coord_origin": "TOPLEFT" }, "text": "Decoder", "orig": "Decoder", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 72, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 332.2, "r_y0": 520.2, "r_x1": 358.1, "r_y1": 520.2, "r_x2": 358.1, "r_y2": 515.9, "r_x3": 332.2, "r_y3": 515.9, "coord_origin": "TOPLEFT" }, "text": "[x1, y2, x2, y2]", "orig": "[x1, y2, x2, y2]", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 73, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 332.2, "r_y0": 526.2, "r_x1": 361.6, "r_y1": 526.2, "r_x2": 361.6, "r_y2": 522.0, "r_x3": 332.2, "r_y3": 522.0, "coord_origin": "TOPLEFT" }, "text": "[x1', y2', x2', y2']", "orig": "[x1', y2', x2', y2']", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 74, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 332.2, "r_y0": 532.3, "r_x1": 364.8, "r_y1": 532.3, "r_x2": 364.8, "r_y2": 528.0, "r_x3": 332.2, "r_y3": 528.0, "coord_origin": "TOPLEFT" }, "text": "[x1'', y2'', x2'', y2'']", "orig": "[x1'', y2'', x2'', y2'']", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 75, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 332.2, "r_y0": 538.4, "r_x1": 336.0, "r_y1": 538.4, "r_x2": 336.0, "r_y2": 534.1, "r_x3": 332.2, "r_y3": 534.1, "coord_origin": "TOPLEFT" }, "text": "...", "orig": "...", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 76, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 326.9, "r_y0": 520.7, "r_x1": 329.4, "r_y1": 520.7, "r_x2": 329.4, "r_y2": 516.4, "r_x3": 326.9, "r_y3": 516.4, "coord_origin": "TOPLEFT" }, "text": "1", "orig": "1", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 77, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 327.0, "r_y0": 526.7, "r_x1": 329.6, "r_y1": 526.7, "r_x2": 329.6, "r_y2": 522.4, "r_x3": 327.0, "r_y3": 522.4, "coord_origin": "TOPLEFT" }, "text": "2", "orig": "2", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 78, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 327.0, "r_y0": 532.8, "r_x1": 329.6, "r_y1": 532.8, "r_x2": 329.6, "r_y2": 528.5, "r_x3": 327.0, "r_y3": 528.5, "coord_origin": "TOPLEFT" }, "text": "3", "orig": "3", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 79, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 424.1, "r_y0": 531.7, "r_x1": 426.7, "r_y1": 531.7, "r_x2": 426.7, "r_y2": 527.4, "r_x3": 424.1, "r_y3": 527.4, "coord_origin": "TOPLEFT" }, "text": "3", "orig": "3", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 80, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 453.0, "r_y0": 521.7, "r_x1": 455.5, "r_y1": 521.7, "r_x2": 455.5, "r_y2": 517.5, "r_x3": 453.0, "r_y3": 517.5, "coord_origin": "TOPLEFT" }, "text": "2", "orig": "2", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 81, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 423.9, "r_y0": 521.3, "r_x1": 426.4, "r_y1": 521.3, "r_x2": 426.4, "r_y2": 517.1, "r_x3": 423.9, "r_y3": 517.1, "coord_origin": "TOPLEFT" }, "text": "1", "orig": "1", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 82, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 333.4, "r_y0": 562.4, "r_x1": 337.3, "r_y1": 562.4, "r_x2": 337.3, "r_y2": 557.4, "r_x3": 333.4, "r_y3": 557.4, "coord_origin": "TOPLEFT" }, "text": "C", "orig": "C", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 83, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 340.4, "r_y0": 562.3, "r_x1": 344.2, "r_y1": 562.3, "r_x2": 344.2, "r_y2": 557.3, "r_x3": 340.4, "r_y3": 557.3, "coord_origin": "TOPLEFT" }, "text": "C", "orig": "C", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 84, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 340.3, "r_y0": 568.9, "r_x1": 344.2, "r_y1": 568.9, "r_x2": 344.2, "r_y2": 563.9, "r_x3": 340.3, "r_y3": 563.9, "coord_origin": "TOPLEFT" }, "text": "C", "orig": "C", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 85, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 346.8, "r_y0": 568.9, "r_x1": 350.6, "r_y1": 568.9, "r_x2": 350.6, "r_y2": 563.9, "r_x3": 346.8, "r_y3": 563.9, "coord_origin": "TOPLEFT" }, "text": "C", "orig": "C", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 86, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 333.6, "r_y0": 568.8, "r_x1": 337.4, "r_y1": 568.8, "r_x2": 337.4, "r_y2": 563.8, "r_x3": 333.6, "r_y3": 563.8, "coord_origin": "TOPLEFT" }, "text": "C", "orig": "C", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 87, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 340.4, "r_y0": 575.4, "r_x1": 344.2, "r_y1": 575.4, "r_x2": 344.2, "r_y2": 570.4, "r_x3": 340.4, "r_y3": 570.4, "coord_origin": "TOPLEFT" }, "text": "C", "orig": "C", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 88, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 346.9, "r_y0": 575.4, "r_x1": 350.7, "r_y1": 575.4, "r_x2": 350.7, "r_y2": 570.4, "r_x3": 346.9, "r_y3": 570.4, "coord_origin": "TOPLEFT" }, "text": "C", "orig": "C", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 89, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 333.7, "r_y0": 575.4, "r_x1": 337.5, "r_y1": 575.4, "r_x2": 337.5, "r_y2": 570.4, "r_x3": 333.7, "r_y3": 570.4, "coord_origin": "TOPLEFT" }, "text": "C", "orig": "C", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 90, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 340.4, "r_y0": 582.0, "r_x1": 344.2, "r_y1": 582.0, "r_x2": 344.2, "r_y2": 577.0, "r_x3": 340.4, "r_y3": 577.0, "coord_origin": "TOPLEFT" }, "text": "C", "orig": "C", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 91, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 346.9, "r_y0": 582.0, "r_x1": 350.7, "r_y1": 582.0, "r_x2": 350.7, "r_y2": 577.0, "r_x3": 346.9, "r_y3": 577.0, "coord_origin": "TOPLEFT" }, "text": "C", "orig": "C", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 92, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 333.7, "r_y0": 582.0, "r_x1": 337.5, "r_y1": 582.0, "r_x2": 337.5, "r_y2": 577.0, "r_x3": 333.7, "r_y3": 577.0, "coord_origin": "TOPLEFT" }, "text": "C", "orig": "C", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 93, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 340.3, "r_y0": 588.4, "r_x1": 344.1, "r_y1": 588.4, "r_x2": 344.1, "r_y2": 583.4, "r_x3": 340.3, "r_y3": 583.4, "coord_origin": "TOPLEFT" }, "text": "C", "orig": "C", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 94, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 346.8, "r_y0": 588.4, "r_x1": 350.6, "r_y1": 588.4, "r_x2": 350.6, "r_y2": 583.4, "r_x3": 346.8, "r_y3": 583.4, "coord_origin": "TOPLEFT" }, "text": "C", "orig": "C", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 95, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 333.6, "r_y0": 588.3, "r_x1": 337.4, "r_y1": 588.3, "r_x2": 337.4, "r_y2": 583.4, "r_x3": 333.6, "r_y3": 583.4, "coord_origin": "TOPLEFT" }, "text": "C", "orig": "C", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 96, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 353.0, "r_y0": 561.9, "r_x1": 359.8, "r_y1": 561.9, "r_x2": 359.8, "r_y2": 556.9, "r_x3": 353.0, "r_y3": 556.9, "coord_origin": "TOPLEFT" }, "text": "NL", "orig": "NL", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 97, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 353.2, "r_y0": 568.6, "r_x1": 360.0, "r_y1": 568.6, "r_x2": 360.0, "r_y2": 563.6, "r_x3": 353.2, "r_y3": 563.6, "coord_origin": "TOPLEFT" }, "text": "NL", "orig": "NL", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 98, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 353.2, "r_y0": 575.2, "r_x1": 360.0, "r_y1": 575.2, "r_x2": 360.0, "r_y2": 570.2, "r_x3": 353.2, "r_y3": 570.2, "coord_origin": "TOPLEFT" }, "text": "NL", "orig": "NL", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 99, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 353.2, "r_y0": 581.8, "r_x1": 360.0, "r_y1": 581.8, "r_x2": 360.0, "r_y2": 576.8, "r_x3": 353.2, "r_y3": 576.8, "coord_origin": "TOPLEFT" }, "text": "NL", "orig": "NL", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 100, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 353.3, "r_y0": 588.4, "r_x1": 360.1, "r_y1": 588.4, "r_x2": 360.1, "r_y2": 583.4, "r_x3": 353.3, "r_y3": 583.4, "coord_origin": "TOPLEFT" }, "text": "NL", "orig": "NL", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 101, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 347.4, "r_y0": 562.1, "r_x1": 350.3, "r_y1": 562.1, "r_x2": 350.3, "r_y2": 557.1, "r_x3": 347.4, "r_y3": 557.1, "coord_origin": "TOPLEFT" }, "text": "L", "orig": "L", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 102, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 331.1, "r_y0": 568.6, "r_x1": 333.7, "r_y1": 568.6, "r_x2": 333.7, "r_y2": 564.3, "r_x3": 331.1, "r_y3": 564.3, "coord_origin": "TOPLEFT" }, "text": "3", "orig": "3", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 103, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 340.8, "r_y0": 558.9, "r_x1": 343.3, "r_y1": 558.9, "r_x2": 343.3, "r_y2": 554.6, "r_x3": 340.8, "r_y3": 554.6, "coord_origin": "TOPLEFT" }, "text": "2", "orig": "2", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 104, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 331.0, "r_y0": 559.1, "r_x1": 333.5, "r_y1": 559.1, "r_x2": 333.5, "r_y2": 554.8, "r_x3": 331.0, "r_y3": 554.8, "coord_origin": "TOPLEFT" }, "text": "1", "orig": "1", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 105, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 149.7, "r_y0": 629.0, "r_x1": 480.6, "r_y1": 629.0, "r_x2": 480.6, "r_y2": 620.2, "r_x3": 149.7, "r_y3": 620.2, "coord_origin": "TOPLEFT" }, "text": "We rely on standard metrics such as Tree Edit Distance score (TEDs) for", "orig": "We rely on standard metrics such as Tree Edit Distance score (TEDs) for", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 106, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 134.8, "r_y0": 640.9, "r_x1": 480.6, "r_y1": 640.9, "r_x2": 480.6, "r_y2": 632.1, "r_x3": 134.8, "r_y3": 632.1, "coord_origin": "TOPLEFT" }, "text": "table structure prediction, and Mean Average Precision (mAP) with 0.75 Inter-", "orig": "table structure prediction, and Mean Average Precision (mAP) with 0.75 Inter-", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 107, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 134.8, "r_y0": 652.9, "r_x1": 480.6, "r_y1": 652.9, "r_x2": 480.6, "r_y2": 644.1, "r_x3": 134.8, "r_y3": 644.1, "coord_origin": "TOPLEFT" }, "text": "section Over Union (IOU) threshold for the bounding-box predictions of table", "orig": "section Over Union (IOU) threshold for the bounding-box predictions of table", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 108, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 134.8, "r_y0": 664.9, "r_x1": 480.6, "r_y1": 664.9, "r_x2": 480.6, "r_y2": 656.1, "r_x3": 134.8, "r_y3": 656.1, "coord_origin": "TOPLEFT" }, "text": "cells. The predicted OTSL structures were converted back to HTML format in", "orig": "cells. The predicted OTSL structures were converted back to HTML format in", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "has_chars": false, "has_words": false, "has_lines": true, "image": null, "lines": [] }, "predictions": { "layout": { "clusters": [ { "id": 9, "label": "page_header", "bbox": { "l": 134.8, "t": 93.8, "r": 139.4, "b": 101.8, "coord_origin": "TOPLEFT" }, "confidence": 0.83, "cells": [ { "index": 0, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 134.8, "r_y0": 101.8, "r_x1": 139.4, "r_y1": 101.8, "r_x2": 139.4, "r_y2": 93.8, "r_x3": 134.8, "r_y3": 93.8, "coord_origin": "TOPLEFT" }, "text": "8", "orig": "8", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 8, "label": "page_header", "bbox": { "l": 167.8, "t": 93.8, "r": 231.7, "b": 101.8, "coord_origin": "TOPLEFT" }, "confidence": 0.86, "cells": [ { "index": 1, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 167.8, "r_y0": 101.8, "r_x1": 178.1, "r_y1": 101.8, "r_x2": 178.1, "r_y2": 93.8, "r_x3": 167.8, "r_y3": 93.8, "coord_origin": "TOPLEFT" }, "text": "M.", "orig": "M.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 2, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 182.4, "r_y0": 101.8, "r_x1": 231.7, "r_y1": 101.8, "r_x2": 231.7, "r_y2": 93.8, "r_x3": 182.4, "r_y3": 93.8, "coord_origin": "TOPLEFT" }, "text": "Lysak, et al.", "orig": "Lysak, et al.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 5, "label": "text", "bbox": { "l": 134.8, "t": 118.9, "r": 480.6, "b": 139.7, "coord_origin": "TOPLEFT" }, "confidence": 0.95, "cells": [ { "index": 3, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 134.8, "r_y0": 127.7, "r_x1": 480.6, "r_y1": 127.7, "r_x2": 480.6, "r_y2": 118.9, "r_x3": 134.8, "r_y3": 118.9, "coord_origin": "TOPLEFT" }, "text": "reduces significantly the column drift seen in the HTML based models (see Fig-", "orig": "reduces significantly the column drift seen in the HTML based models (see Fig-", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 4, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 134.8, "r_y0": 139.7, "r_x1": 163.6, "r_y1": 139.7, "r_x2": 163.6, "r_y2": 130.9, "r_x3": 134.8, "r_y3": 130.9, "coord_origin": "TOPLEFT" }, "text": "ure 5).", "orig": "ure 5).", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 2, "label": "section_header", "bbox": { "l": 134.8, "t": 161.6, "r": 319.3, "b": 170.4, "coord_origin": "TOPLEFT" }, "confidence": 0.95, "cells": [ { "index": 5, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 134.8, "r_y0": 170.4, "r_x1": 149.4, "r_y1": 170.4, "r_x2": 149.4, "r_y2": 161.6, "r_x3": 134.8, "r_y3": 161.6, "coord_origin": "TOPLEFT" }, "text": "4.3", "orig": "4.3", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 6, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 160.9, "r_y0": 170.4, "r_x1": 319.3, "r_y1": 170.4, "r_x2": 319.3, "r_y2": 161.6, "r_x3": 160.9, "r_y3": 161.6, "coord_origin": "TOPLEFT" }, "text": "Error-detection and -mitigation", "orig": "Error-detection and -mitigation", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 0, "label": "text", "bbox": { "l": 134.8, "t": 182.3, "r": 480.6, "b": 298.7, "coord_origin": "TOPLEFT" }, "confidence": 0.99, "cells": [ { "index": 7, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 134.8, "r_y0": 191.1, "r_x1": 480.6, "r_y1": 191.1, "r_x2": 480.6, "r_y2": 182.3, "r_x3": 134.8, "r_y3": 182.3, "coord_origin": "TOPLEFT" }, "text": "The design of OTSL allows to validate a table structure easily on an unfinished", "orig": "The design of OTSL allows to validate a table structure easily on an unfinished", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 8, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 134.8, "r_y0": 203.0, "r_x1": 480.6, "r_y1": 203.0, "r_x2": 480.6, "r_y2": 194.2, "r_x3": 134.8, "r_y3": 194.2, "coord_origin": "TOPLEFT" }, "text": "sequence. The detection of an invalid sequence token is a clear indication of a", "orig": "sequence. The detection of an invalid sequence token is a clear indication of a", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 9, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 134.8, "r_y0": 215.0, "r_x1": 480.6, "r_y1": 215.0, "r_x2": 480.6, "r_y2": 206.2, "r_x3": 134.8, "r_y3": 206.2, "coord_origin": "TOPLEFT" }, "text": "prediction mistake, however a valid sequence by itself does not guarantee pre-", "orig": "prediction mistake, however a valid sequence by itself does not guarantee pre-", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 10, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 134.8, "r_y0": 226.9, "r_x1": 480.6, "r_y1": 226.9, "r_x2": 480.6, "r_y2": 218.1, "r_x3": 134.8, "r_y3": 218.1, "coord_origin": "TOPLEFT" }, "text": "diction correctness. Different heuristics can be used to correct token errors in", "orig": "diction correctness. Different heuristics can be used to correct token errors in", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 11, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 134.8, "r_y0": 238.9, "r_x1": 480.6, "r_y1": 238.9, "r_x2": 480.6, "r_y2": 230.1, "r_x3": 134.8, "r_y3": 230.1, "coord_origin": "TOPLEFT" }, "text": "an invalid sequence and thus increase the chances for accurate predictions. Such", "orig": "an invalid sequence and thus increase the chances for accurate predictions. Such", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 12, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 134.8, "r_y0": 250.9, "r_x1": 480.6, "r_y1": 250.9, "r_x2": 480.6, "r_y2": 242.1, "r_x3": 134.8, "r_y3": 242.1, "coord_origin": "TOPLEFT" }, "text": "heuristics can be applied either after the prediction of each token, or at the end", "orig": "heuristics can be applied either after the prediction of each token, or at the end", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 13, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 134.8, "r_y0": 262.8, "r_x1": 480.6, "r_y1": 262.8, "r_x2": 480.6, "r_y2": 254.0, "r_x3": 134.8, "r_y3": 254.0, "coord_origin": "TOPLEFT" }, "text": "on the entire predicted sequence. For example a simple heuristic which can cor-", "orig": "on the entire predicted sequence. For example a simple heuristic which can cor-", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 14, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 134.8, "r_y0": 274.8, "r_x1": 480.6, "r_y1": 274.8, "r_x2": 480.6, "r_y2": 266.0, "r_x3": 134.8, "r_y3": 266.0, "coord_origin": "TOPLEFT" }, "text": "rect the predicted OTSL sequence on-the-fly is to verify if the token with the", "orig": "rect the predicted OTSL sequence on-the-fly is to verify if the token with the", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 15, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 134.8, "r_y0": 286.7, "r_x1": 480.6, "r_y1": 286.7, "r_x2": 480.6, "r_y2": 277.9, "r_x3": 134.8, "r_y3": 277.9, "coord_origin": "TOPLEFT" }, "text": "highest prediction confidence invalidates the predicted sequence, and replace it", "orig": "highest prediction confidence invalidates the predicted sequence, and replace it", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 16, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 134.8, "r_y0": 298.7, "r_x1": 469.4, "r_y1": 298.7, "r_x2": 469.4, "r_y2": 289.9, "r_x3": 134.8, "r_y3": 289.9, "coord_origin": "TOPLEFT" }, "text": "by the token with the next highest confidence until OTSL rules are satisfied.", "orig": "by the token with the next highest confidence until OTSL rules are satisfied.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 3, "label": "section_header", "bbox": { "l": 134.8, "t": 321.2, "r": 229.0, "b": 331.7, "coord_origin": "TOPLEFT" }, "confidence": 0.95, "cells": [ { "index": 17, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 134.8, "r_y0": 331.7, "r_x1": 141.5, "r_y1": 331.7, "r_x2": 141.5, "r_y2": 321.2, "r_x3": 134.8, "r_y3": 321.2, "coord_origin": "TOPLEFT" }, "text": "5", "orig": "5", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 18, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 154.9, "r_y0": 331.7, "r_x1": 229.0, "r_y1": 331.7, "r_x2": 229.0, "r_y2": 321.2, "r_x3": 154.9, "r_y3": 321.2, "coord_origin": "TOPLEFT" }, "text": "Experiments", "orig": "Experiments", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 1, "label": "text", "bbox": { "l": 134.8, "t": 347.2, "r": 480.6, "b": 451.7, "coord_origin": "TOPLEFT" }, "confidence": 0.99, "cells": [ { "index": 19, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 134.8, "r_y0": 356.0, "r_x1": 480.6, "r_y1": 356.0, "r_x2": 480.6, "r_y2": 347.2, "r_x3": 134.8, "r_y3": 347.2, "coord_origin": "TOPLEFT" }, "text": "To evaluate the impact of OTSL on prediction accuracy and inference times, we", "orig": "To evaluate the impact of OTSL on prediction accuracy and inference times, we", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 20, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 134.8, "r_y0": 368.0, "r_x1": 480.6, "r_y1": 368.0, "r_x2": 480.6, "r_y2": 359.2, "r_x3": 134.8, "r_y3": 359.2, "coord_origin": "TOPLEFT" }, "text": "conducted a series of experiments based on the TableFormer model (Figure 4)", "orig": "conducted a series of experiments based on the TableFormer model (Figure 4)", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 21, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 134.8, "r_y0": 380.0, "r_x1": 480.6, "r_y1": 380.0, "r_x2": 480.6, "r_y2": 371.2, "r_x3": 134.8, "r_y3": 371.2, "coord_origin": "TOPLEFT" }, "text": "with two objectives: Firstly we evaluate the prediction quality and performance", "orig": "with two objectives: Firstly we evaluate the prediction quality and performance", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 22, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 134.8, "r_y0": 391.9, "r_x1": 480.6, "r_y1": 391.9, "r_x2": 480.6, "r_y2": 383.1, "r_x3": 134.8, "r_y3": 383.1, "coord_origin": "TOPLEFT" }, "text": "of OTSL vs. HTML after performing Hyper Parameter Optimization (HPO) on", "orig": "of OTSL vs. HTML after performing Hyper Parameter Optimization (HPO) on", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 23, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 134.8, "r_y0": 403.9, "r_x1": 148.6, "r_y1": 403.9, "r_x2": 148.6, "r_y2": 395.1, "r_x3": 134.8, "r_y3": 395.1, "coord_origin": "TOPLEFT" }, "text": "the", "orig": "the", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 24, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 151.6, "r_y0": 403.9, "r_x1": 191.8, "r_y1": 403.9, "r_x2": 191.8, "r_y2": 395.1, "r_x3": 151.6, "r_y3": 395.1, "coord_origin": "TOPLEFT" }, "text": "canonical", "orig": "canonical", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 25, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 195.9, "r_y0": 403.9, "r_x1": 480.6, "r_y1": 403.9, "r_x2": 480.6, "r_y2": 395.1, "r_x3": 195.9, "r_y3": 395.1, "coord_origin": "TOPLEFT" }, "text": "PubTabNet data set. Secondly we pick the best hyper-parameters", "orig": "PubTabNet data set. Secondly we pick the best hyper-parameters", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 26, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 134.8, "r_y0": 415.8, "r_x1": 480.6, "r_y1": 415.8, "r_x2": 480.6, "r_y2": 407.0, "r_x3": 134.8, "r_y3": 407.0, "coord_origin": "TOPLEFT" }, "text": "found in the first step and evaluate how OTSL impacts the performance of", "orig": "found in the first step and evaluate how OTSL impacts the performance of", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 27, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 134.8, "r_y0": 427.8, "r_x1": 480.6, "r_y1": 427.8, "r_x2": 480.6, "r_y2": 419.0, "r_x3": 134.8, "r_y3": 419.0, "coord_origin": "TOPLEFT" }, "text": "TableFormer after training on other publicly available data sets (FinTabNet,", "orig": "TableFormer after training on other publicly available data sets (FinTabNet,", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 28, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 134.8, "r_y0": 439.7, "r_x1": 480.6, "r_y1": 439.7, "r_x2": 480.6, "r_y2": 430.9, "r_x3": 134.8, "r_y3": 430.9, "coord_origin": "TOPLEFT" }, "text": "PubTables-1M [14]). The ground truth (GT) from all data sets has been con-", "orig": "PubTables-1M [14]). The ground truth (GT) from all data sets has been con-", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 29, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 134.8, "r_y0": 451.7, "r_x1": 479.3, "r_y1": 451.7, "r_x2": 479.3, "r_y2": 442.9, "r_x3": 134.8, "r_y3": 442.9, "coord_origin": "TOPLEFT" }, "text": "verted into OTSL format for this purpose, and will be made publicly available.", "orig": "verted into OTSL format for this purpose, and will be made publicly available.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 7, "label": "caption", "bbox": { "l": 134.8, "t": 484.6, "r": 480.6, "b": 503.7, "coord_origin": "TOPLEFT" }, "confidence": 0.93, "cells": [ { "index": 30, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 134.8, "r_y0": 492.6, "r_x1": 162.6, "r_y1": 492.6, "r_x2": 162.6, "r_y2": 484.6, "r_x3": 134.8, "r_y3": 484.6, "coord_origin": "TOPLEFT" }, "text": "Fig. 4.", "orig": "Fig. 4.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 31, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 165.2, "r_y0": 492.8, "r_x1": 480.6, "r_y1": 492.8, "r_x2": 480.6, "r_y2": 484.7, "r_x3": 165.2, "r_y3": 484.7, "coord_origin": "TOPLEFT" }, "text": "Architecture sketch of the TableFormer model, which is a representative for the", "orig": "Architecture sketch of the TableFormer model, which is a representative for the", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 32, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 134.8, "r_y0": 503.7, "r_x1": 206.7, "r_y1": 503.7, "r_x2": 206.7, "r_y2": 495.7, "r_x3": 134.8, "r_y3": 495.7, "coord_origin": "TOPLEFT" }, "text": "Im2Seq approach.", "orig": "Im2Seq approach.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 6, "label": "picture", "bbox": { "l": 140.7, "t": 508.1, "r": 472.7, "b": 593.7, "coord_origin": "TOPLEFT" }, "confidence": 0.93, "cells": [ { "index": 33, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 147.3, "r_y0": 543.1, "r_x1": 149.7, "r_y1": 543.1, "r_x2": 149.7, "r_y2": 540.7, "r_x3": 147.3, "r_y3": 540.7, "coord_origin": "TOPLEFT" }, "text": "1.", "orig": "1.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 34, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 150.9, "r_y0": 543.1, "r_x1": 155.7, "r_y1": 543.1, "r_x2": 155.7, "r_y2": 540.7, "r_x3": 150.9, "r_y3": 540.7, "coord_origin": "TOPLEFT" }, "text": "Item", "orig": "Item", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 35, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 162.8, "r_y0": 537.8, "r_x1": 172.3, "r_y1": 537.8, "r_x2": 172.3, "r_y2": 535.4, "r_x3": 162.8, "r_y3": 535.4, "coord_origin": "TOPLEFT" }, "text": "Amount", "orig": "Amount", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 36, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 147.6, "r_y0": 537.7, "r_x1": 155.9, "r_y1": 537.7, "r_x2": 155.9, "r_y2": 535.4, "r_x3": 147.6, "r_y3": 535.4, "coord_origin": "TOPLEFT" }, "text": "Names", "orig": "Names", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 37, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 158.5, "r_y0": 543.1, "r_x1": 164.1, "r_y1": 543.1, "r_x2": 164.1, "r_y2": 540.7, "r_x3": 158.5, "r_y3": 540.7, "coord_origin": "TOPLEFT" }, "text": "1000", "orig": "1000", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 38, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 158.5, "r_y0": 547.0, "r_x1": 162.7, "r_y1": 547.0, "r_x2": 162.7, "r_y2": 544.7, "r_x3": 158.5, "r_y3": 544.7, "coord_origin": "TOPLEFT" }, "text": "500", "orig": "500", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 39, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 158.5, "r_y0": 551.3, "r_x1": 164.1, "r_y1": 551.3, "r_x2": 164.1, "r_y2": 548.9, "r_x3": 158.5, "r_y3": 548.9, "coord_origin": "TOPLEFT" }, "text": "3500", "orig": "3500", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 40, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 158.5, "r_y0": 555.5, "r_x1": 162.7, "r_y1": 555.5, "r_x2": 162.7, "r_y2": 553.2, "r_x3": 158.5, "r_y3": 553.2, "coord_origin": "TOPLEFT" }, "text": "150", "orig": "150", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 41, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 168.8, "r_y0": 543.1, "r_x1": 172.9, "r_y1": 543.1, "r_x2": 172.9, "r_y2": 540.7, "r_x3": 168.8, "r_y3": 540.7, "coord_origin": "TOPLEFT" }, "text": "unit", "orig": "unit", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 42, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 168.8, "r_y0": 547.0, "r_x1": 172.9, "r_y1": 547.0, "r_x2": 172.9, "r_y2": 544.7, "r_x3": 168.8, "r_y3": 544.7, "coord_origin": "TOPLEFT" }, "text": "unit", "orig": "unit", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 43, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 168.8, "r_y0": 551.3, "r_x1": 172.9, "r_y1": 551.3, "r_x2": 172.9, "r_y2": 548.9, "r_x3": 168.8, "r_y3": 548.9, "coord_origin": "TOPLEFT" }, "text": "unit", "orig": "unit", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 44, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 168.8, "r_y0": 555.5, "r_x1": 172.9, "r_y1": 555.5, "r_x2": 172.9, "r_y2": 553.2, "r_x3": 168.8, "r_y3": 553.2, "coord_origin": "TOPLEFT" }, "text": "unit", "orig": "unit", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 45, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 147.3, "r_y0": 547.0, "r_x1": 149.7, "r_y1": 547.0, "r_x2": 149.7, "r_y2": 544.7, "r_x3": 147.3, "r_y3": 544.7, "coord_origin": "TOPLEFT" }, "text": "2.", "orig": "2.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 46, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 150.9, "r_y0": 547.0, "r_x1": 155.7, "r_y1": 547.0, "r_x2": 155.7, "r_y2": 544.7, "r_x3": 150.9, "r_y3": 544.7, "coord_origin": "TOPLEFT" }, "text": "Item", "orig": "Item", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 47, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 147.3, "r_y0": 551.3, "r_x1": 149.7, "r_y1": 551.3, "r_x2": 149.7, "r_y2": 548.9, "r_x3": 147.3, "r_y3": 548.9, "coord_origin": "TOPLEFT" }, "text": "3.", "orig": "3.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 48, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 150.9, "r_y0": 551.3, "r_x1": 155.7, "r_y1": 551.3, "r_x2": 155.7, "r_y2": 548.9, "r_x3": 150.9, "r_y3": 548.9, "coord_origin": "TOPLEFT" }, "text": "Item", "orig": "Item", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 49, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 147.3, "r_y0": 555.5, "r_x1": 149.7, "r_y1": 555.5, "r_x2": 149.7, "r_y2": 553.2, "r_x3": 147.3, "r_y3": 553.2, "coord_origin": "TOPLEFT" }, "text": "4.", "orig": "4.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 50, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 150.9, "r_y0": 555.5, "r_x1": 155.7, "r_y1": 555.5, "r_x2": 155.7, "r_y2": 553.2, "r_x3": 150.9, "r_y3": 553.2, "coord_origin": "TOPLEFT" }, "text": "Item", "orig": "Item", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 51, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 152.1, "r_y0": 521.3, "r_x1": 171.2, "r_y1": 521.3, "r_x2": 171.2, "r_y2": 517.0, "r_x3": 152.1, "r_y3": 517.0, "coord_origin": "TOPLEFT" }, "text": "Extracted", "orig": "Extracted", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 52, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 148.1, "r_y0": 526.6, "r_x1": 175.2, "r_y1": 526.6, "r_x2": 175.2, "r_y2": 522.3, "r_x3": 148.1, "r_y3": 522.3, "coord_origin": "TOPLEFT" }, "text": "Table Images", "orig": "Table Images", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 53, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 193.5, "r_y0": 528.8, "r_x1": 220.3, "r_y1": 528.8, "r_x2": 220.3, "r_y2": 524.5, "r_x3": 193.5, "r_y3": 524.5, "coord_origin": "TOPLEFT" }, "text": "Standardized", "orig": "Standardized", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 54, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 199.5, "r_y0": 534.1, "r_x1": 214.4, "r_y1": 534.1, "r_x2": 214.4, "r_y2": 529.8, "r_x3": 199.5, "r_y3": 529.8, "coord_origin": "TOPLEFT" }, "text": "Images", "orig": "Images", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 55, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 273.6, "r_y0": 514.2, "r_x1": 284.5, "r_y1": 514.2, "r_x2": 284.5, "r_y2": 509.9, "r_x3": 273.6, "r_y3": 509.9, "coord_origin": "TOPLEFT" }, "text": "BBox", "orig": "BBox", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 56, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 270.5, "r_y0": 518.0, "r_x1": 287.6, "r_y1": 518.0, "r_x2": 287.6, "r_y2": 513.7, "r_x3": 270.5, "r_y3": 513.7, "coord_origin": "TOPLEFT" }, "text": "Decoder", "orig": "Decoder", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 57, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 332.5, "r_y0": 512.4, "r_x1": 348.1, "r_y1": 512.4, "r_x2": 348.1, "r_y2": 508.1, "r_x3": 332.5, "r_y3": 508.1, "coord_origin": "TOPLEFT" }, "text": "BBoxes", "orig": "BBoxes", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 58, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 376.7, "r_y0": 525.4, "r_x1": 407.3, "r_y1": 525.4, "r_x2": 407.3, "r_y2": 521.1, "r_x3": 376.7, "r_y3": 521.1, "coord_origin": "TOPLEFT" }, "text": "BBoxes can be", "orig": "BBoxes can be", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 59, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 373.9, "r_y0": 529.9, "r_x1": 410.0, "r_y1": 529.9, "r_x2": 410.0, "r_y2": 525.7, "r_x3": 373.9, "r_y3": 525.7, "coord_origin": "TOPLEFT" }, "text": "traced back to the", "orig": "traced back to the", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 60, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 375.3, "r_y0": 534.5, "r_x1": 408.6, "r_y1": 534.5, "r_x2": 408.6, "r_y2": 530.2, "r_x3": 375.3, "r_y3": 530.2, "coord_origin": "TOPLEFT" }, "text": "original image to", "orig": "original image to", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 61, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 377.1, "r_y0": 539.0, "r_x1": 406.9, "r_y1": 539.0, "r_x2": 406.9, "r_y2": 534.8, "r_x3": 377.1, "r_y3": 534.8, "coord_origin": "TOPLEFT" }, "text": "extract content", "orig": "extract content", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 62, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 383.6, "r_y0": 567.5, "r_x1": 433.8, "r_y1": 567.5, "r_x2": 433.8, "r_y2": 563.2, "r_x3": 383.6, "r_y3": 563.2, "coord_origin": "TOPLEFT" }, "text": "Structure Tags sequence", "orig": "Structure Tags sequence", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 63, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 383.5, "r_y0": 572.0, "r_x1": 433.8, "r_y1": 572.0, "r_x2": 433.8, "r_y2": 567.8, "r_x3": 383.5, "r_y3": 567.8, "coord_origin": "TOPLEFT" }, "text": "provide full description of", "orig": "provide full description of", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 64, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 390.5, "r_y0": 576.6, "r_x1": 426.9, "r_y1": 576.6, "r_x2": 426.9, "r_y2": 572.3, "r_x3": 390.5, "r_y3": 572.3, "coord_origin": "TOPLEFT" }, "text": "the table structure", "orig": "the table structure", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 65, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 293.9, "r_y0": 582.2, "r_x1": 323.2, "r_y1": 582.2, "r_x2": 323.2, "r_y2": 577.9, "r_x3": 293.9, "r_y3": 577.9, "coord_origin": "TOPLEFT" }, "text": "Structure Tags", "orig": "Structure Tags", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 66, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 293.9, "r_y0": 586.7, "r_x1": 324.6, "r_y1": 586.7, "r_x2": 324.6, "r_y2": 582.4, "r_x3": 293.9, "r_y3": 582.4, "coord_origin": "TOPLEFT" }, "text": "in OTSL format", "orig": "in OTSL format", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 67, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 333.1, "r_y0": 546.1, "r_x1": 364.1, "r_y1": 546.1, "r_x2": 364.1, "r_y2": 541.8, "r_x3": 333.1, "r_y3": 541.8, "coord_origin": "TOPLEFT" }, "text": "BBoxes in sync", "orig": "BBoxes in sync", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 68, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 333.1, "r_y0": 549.9, "r_x1": 369.7, "r_y1": 549.9, "r_x2": 369.7, "r_y2": 545.6, "r_x3": 333.1, "r_y3": 545.6, "coord_origin": "TOPLEFT" }, "text": "with tag sequence", "orig": "with tag sequence", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 69, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 232.7, "r_y0": 519.5, "r_x1": 249.6, "r_y1": 519.5, "r_x2": 249.6, "r_y2": 515.2, "r_x3": 232.7, "r_y3": 515.2, "coord_origin": "TOPLEFT" }, "text": "Encoder", "orig": "Encoder", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 70, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 269.8, "r_y0": 550.2, "r_x1": 288.3, "r_y1": 550.2, "r_x2": 288.3, "r_y2": 546.0, "r_x3": 269.8, "r_y3": 546.0, "coord_origin": "TOPLEFT" }, "text": "Structure", "orig": "Structure", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 71, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 270.5, "r_y0": 554.0, "r_x1": 287.6, "r_y1": 554.0, "r_x2": 287.6, "r_y2": 549.8, "r_x3": 270.5, "r_y3": 549.8, "coord_origin": "TOPLEFT" }, "text": "Decoder", "orig": "Decoder", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 72, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 332.2, "r_y0": 520.2, "r_x1": 358.1, "r_y1": 520.2, "r_x2": 358.1, "r_y2": 515.9, "r_x3": 332.2, "r_y3": 515.9, "coord_origin": "TOPLEFT" }, "text": "[x1, y2, x2, y2]", "orig": "[x1, y2, x2, y2]", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 73, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 332.2, "r_y0": 526.2, "r_x1": 361.6, "r_y1": 526.2, "r_x2": 361.6, "r_y2": 522.0, "r_x3": 332.2, "r_y3": 522.0, "coord_origin": "TOPLEFT" }, "text": "[x1', y2', x2', y2']", "orig": "[x1', y2', x2', y2']", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 74, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 332.2, "r_y0": 532.3, "r_x1": 364.8, "r_y1": 532.3, "r_x2": 364.8, "r_y2": 528.0, "r_x3": 332.2, "r_y3": 528.0, "coord_origin": "TOPLEFT" }, "text": "[x1'', y2'', x2'', y2'']", "orig": "[x1'', y2'', x2'', y2'']", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 75, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 332.2, "r_y0": 538.4, "r_x1": 336.0, "r_y1": 538.4, "r_x2": 336.0, "r_y2": 534.1, "r_x3": 332.2, "r_y3": 534.1, "coord_origin": "TOPLEFT" }, "text": "...", "orig": "...", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 76, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 326.9, "r_y0": 520.7, "r_x1": 329.4, "r_y1": 520.7, "r_x2": 329.4, "r_y2": 516.4, "r_x3": 326.9, "r_y3": 516.4, "coord_origin": "TOPLEFT" }, "text": "1", "orig": "1", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 77, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 327.0, "r_y0": 526.7, "r_x1": 329.6, "r_y1": 526.7, "r_x2": 329.6, "r_y2": 522.4, "r_x3": 327.0, "r_y3": 522.4, "coord_origin": "TOPLEFT" }, "text": "2", "orig": "2", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 78, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 327.0, "r_y0": 532.8, "r_x1": 329.6, "r_y1": 532.8, "r_x2": 329.6, "r_y2": 528.5, "r_x3": 327.0, "r_y3": 528.5, "coord_origin": "TOPLEFT" }, "text": "3", "orig": "3", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 79, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 424.1, "r_y0": 531.7, "r_x1": 426.7, "r_y1": 531.7, "r_x2": 426.7, "r_y2": 527.4, "r_x3": 424.1, "r_y3": 527.4, "coord_origin": "TOPLEFT" }, "text": "3", "orig": "3", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 80, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 453.0, "r_y0": 521.7, "r_x1": 455.5, "r_y1": 521.7, "r_x2": 455.5, "r_y2": 517.5, "r_x3": 453.0, "r_y3": 517.5, "coord_origin": "TOPLEFT" }, "text": "2", "orig": "2", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 81, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 423.9, "r_y0": 521.3, "r_x1": 426.4, "r_y1": 521.3, "r_x2": 426.4, "r_y2": 517.1, "r_x3": 423.9, "r_y3": 517.1, "coord_origin": "TOPLEFT" }, "text": "1", "orig": "1", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 82, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 333.4, "r_y0": 562.4, "r_x1": 337.3, "r_y1": 562.4, "r_x2": 337.3, "r_y2": 557.4, "r_x3": 333.4, "r_y3": 557.4, "coord_origin": "TOPLEFT" }, "text": "C", "orig": "C", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 83, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 340.4, "r_y0": 562.3, "r_x1": 344.2, "r_y1": 562.3, "r_x2": 344.2, "r_y2": 557.3, "r_x3": 340.4, "r_y3": 557.3, "coord_origin": "TOPLEFT" }, "text": "C", "orig": "C", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 84, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 340.3, "r_y0": 568.9, "r_x1": 344.2, "r_y1": 568.9, "r_x2": 344.2, "r_y2": 563.9, "r_x3": 340.3, "r_y3": 563.9, "coord_origin": "TOPLEFT" }, "text": "C", "orig": "C", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 85, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 346.8, "r_y0": 568.9, "r_x1": 350.6, "r_y1": 568.9, "r_x2": 350.6, "r_y2": 563.9, "r_x3": 346.8, "r_y3": 563.9, "coord_origin": "TOPLEFT" }, "text": "C", "orig": "C", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 86, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 333.6, "r_y0": 568.8, "r_x1": 337.4, "r_y1": 568.8, "r_x2": 337.4, "r_y2": 563.8, "r_x3": 333.6, "r_y3": 563.8, "coord_origin": "TOPLEFT" }, "text": "C", "orig": "C", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 87, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 340.4, "r_y0": 575.4, "r_x1": 344.2, "r_y1": 575.4, "r_x2": 344.2, "r_y2": 570.4, "r_x3": 340.4, "r_y3": 570.4, "coord_origin": "TOPLEFT" }, "text": "C", "orig": "C", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 88, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 346.9, "r_y0": 575.4, "r_x1": 350.7, "r_y1": 575.4, "r_x2": 350.7, "r_y2": 570.4, "r_x3": 346.9, "r_y3": 570.4, "coord_origin": "TOPLEFT" }, "text": "C", "orig": "C", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 89, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 333.7, "r_y0": 575.4, "r_x1": 337.5, "r_y1": 575.4, "r_x2": 337.5, "r_y2": 570.4, "r_x3": 333.7, "r_y3": 570.4, "coord_origin": "TOPLEFT" }, "text": "C", "orig": "C", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 90, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 340.4, "r_y0": 582.0, "r_x1": 344.2, "r_y1": 582.0, "r_x2": 344.2, "r_y2": 577.0, "r_x3": 340.4, "r_y3": 577.0, "coord_origin": "TOPLEFT" }, "text": "C", "orig": "C", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 91, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 346.9, "r_y0": 582.0, "r_x1": 350.7, "r_y1": 582.0, "r_x2": 350.7, "r_y2": 577.0, "r_x3": 346.9, "r_y3": 577.0, "coord_origin": "TOPLEFT" }, "text": "C", "orig": "C", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 92, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 333.7, "r_y0": 582.0, "r_x1": 337.5, "r_y1": 582.0, "r_x2": 337.5, "r_y2": 577.0, "r_x3": 333.7, "r_y3": 577.0, "coord_origin": "TOPLEFT" }, "text": "C", "orig": "C", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 93, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 340.3, "r_y0": 588.4, "r_x1": 344.1, "r_y1": 588.4, "r_x2": 344.1, "r_y2": 583.4, "r_x3": 340.3, "r_y3": 583.4, "coord_origin": "TOPLEFT" }, "text": "C", "orig": "C", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 94, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 346.8, "r_y0": 588.4, "r_x1": 350.6, "r_y1": 588.4, "r_x2": 350.6, "r_y2": 583.4, "r_x3": 346.8, "r_y3": 583.4, "coord_origin": "TOPLEFT" }, "text": "C", "orig": "C", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 95, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 333.6, "r_y0": 588.3, "r_x1": 337.4, "r_y1": 588.3, "r_x2": 337.4, "r_y2": 583.4, "r_x3": 333.6, "r_y3": 583.4, "coord_origin": "TOPLEFT" }, "text": "C", "orig": "C", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 96, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 353.0, "r_y0": 561.9, "r_x1": 359.8, "r_y1": 561.9, "r_x2": 359.8, "r_y2": 556.9, "r_x3": 353.0, "r_y3": 556.9, "coord_origin": "TOPLEFT" }, "text": "NL", "orig": "NL", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 97, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 353.2, "r_y0": 568.6, "r_x1": 360.0, "r_y1": 568.6, "r_x2": 360.0, "r_y2": 563.6, "r_x3": 353.2, "r_y3": 563.6, "coord_origin": "TOPLEFT" }, "text": "NL", "orig": "NL", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 98, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 353.2, "r_y0": 575.2, "r_x1": 360.0, "r_y1": 575.2, "r_x2": 360.0, "r_y2": 570.2, "r_x3": 353.2, "r_y3": 570.2, "coord_origin": "TOPLEFT" }, "text": "NL", "orig": "NL", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 99, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 353.2, "r_y0": 581.8, "r_x1": 360.0, "r_y1": 581.8, "r_x2": 360.0, "r_y2": 576.8, "r_x3": 353.2, "r_y3": 576.8, "coord_origin": "TOPLEFT" }, "text": "NL", "orig": "NL", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 100, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 353.3, "r_y0": 588.4, "r_x1": 360.1, "r_y1": 588.4, "r_x2": 360.1, "r_y2": 583.4, "r_x3": 353.3, "r_y3": 583.4, "coord_origin": "TOPLEFT" }, "text": "NL", "orig": "NL", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 101, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 347.4, "r_y0": 562.1, "r_x1": 350.3, "r_y1": 562.1, "r_x2": 350.3, "r_y2": 557.1, "r_x3": 347.4, "r_y3": 557.1, "coord_origin": "TOPLEFT" }, "text": "L", "orig": "L", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 102, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 331.1, "r_y0": 568.6, "r_x1": 333.7, "r_y1": 568.6, "r_x2": 333.7, "r_y2": 564.3, "r_x3": 331.1, "r_y3": 564.3, "coord_origin": "TOPLEFT" }, "text": "3", "orig": "3", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 103, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 340.8, "r_y0": 558.9, "r_x1": 343.3, "r_y1": 558.9, "r_x2": 343.3, "r_y2": 554.6, "r_x3": 340.8, "r_y3": 554.6, "coord_origin": "TOPLEFT" }, "text": "2", "orig": "2", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 104, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 331.0, "r_y0": 559.1, "r_x1": 333.5, "r_y1": 559.1, "r_x2": 333.5, "r_y2": 554.8, "r_x3": 331.0, "r_y3": 554.8, "coord_origin": "TOPLEFT" }, "text": "1", "orig": "1", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [ { "id": 13, "label": "text", "bbox": { "l": 147.3, "t": 540.7, "r": 149.7, "b": 543.1, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 33, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 147.3, "r_y0": 543.1, "r_x1": 149.7, "r_y1": 543.1, "r_x2": 149.7, "r_y2": 540.7, "r_x3": 147.3, "r_y3": 540.7, "coord_origin": "TOPLEFT" }, "text": "1.", "orig": "1.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 14, "label": "text", "bbox": { "l": 150.9, "t": 540.7, "r": 155.7, "b": 543.1, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 34, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 150.9, "r_y0": 543.1, "r_x1": 155.7, "r_y1": 543.1, "r_x2": 155.7, "r_y2": 540.7, "r_x3": 150.9, "r_y3": 540.7, "coord_origin": "TOPLEFT" }, "text": "Item", "orig": "Item", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 15, "label": "text", "bbox": { "l": 162.8, "t": 535.4, "r": 172.3, "b": 537.8, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 35, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 162.8, "r_y0": 537.8, "r_x1": 172.3, "r_y1": 537.8, "r_x2": 172.3, "r_y2": 535.4, "r_x3": 162.8, "r_y3": 535.4, "coord_origin": "TOPLEFT" }, "text": "Amount", "orig": "Amount", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 16, "label": "text", "bbox": { "l": 147.6, "t": 535.4, "r": 155.9, "b": 537.7, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 36, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 147.6, "r_y0": 537.7, "r_x1": 155.9, "r_y1": 537.7, "r_x2": 155.9, "r_y2": 535.4, "r_x3": 147.6, "r_y3": 535.4, "coord_origin": "TOPLEFT" }, "text": "Names", "orig": "Names", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 17, "label": "text", "bbox": { "l": 158.5, "t": 540.7, "r": 164.1, "b": 543.1, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 37, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 158.5, "r_y0": 543.1, "r_x1": 164.1, "r_y1": 543.1, "r_x2": 164.1, "r_y2": 540.7, "r_x3": 158.5, "r_y3": 540.7, "coord_origin": "TOPLEFT" }, "text": "1000", "orig": "1000", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 18, "label": "text", "bbox": { "l": 158.5, "t": 544.7, "r": 162.7, "b": 547.0, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 38, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 158.5, "r_y0": 547.0, "r_x1": 162.7, "r_y1": 547.0, "r_x2": 162.7, "r_y2": 544.7, "r_x3": 158.5, "r_y3": 544.7, "coord_origin": "TOPLEFT" }, "text": "500", "orig": "500", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 19, "label": "text", "bbox": { "l": 158.5, "t": 548.9, "r": 164.1, "b": 551.3, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 39, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 158.5, "r_y0": 551.3, "r_x1": 164.1, "r_y1": 551.3, "r_x2": 164.1, "r_y2": 548.9, "r_x3": 158.5, "r_y3": 548.9, "coord_origin": "TOPLEFT" }, "text": "3500", "orig": "3500", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 20, "label": "text", "bbox": { "l": 158.5, "t": 553.2, "r": 162.7, "b": 555.5, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 40, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 158.5, "r_y0": 555.5, "r_x1": 162.7, "r_y1": 555.5, "r_x2": 162.7, "r_y2": 553.2, "r_x3": 158.5, "r_y3": 553.2, "coord_origin": "TOPLEFT" }, "text": "150", "orig": "150", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 21, "label": "text", "bbox": { "l": 168.8, "t": 540.7, "r": 172.9, "b": 543.1, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 41, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 168.8, "r_y0": 543.1, "r_x1": 172.9, "r_y1": 543.1, "r_x2": 172.9, "r_y2": 540.7, "r_x3": 168.8, "r_y3": 540.7, "coord_origin": "TOPLEFT" }, "text": "unit", "orig": "unit", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 22, "label": "text", "bbox": { "l": 168.8, "t": 544.7, "r": 172.9, "b": 547.0, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 42, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 168.8, "r_y0": 547.0, "r_x1": 172.9, "r_y1": 547.0, "r_x2": 172.9, "r_y2": 544.7, "r_x3": 168.8, "r_y3": 544.7, "coord_origin": "TOPLEFT" }, "text": "unit", "orig": "unit", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 23, "label": "text", "bbox": { "l": 168.8, "t": 548.9, "r": 172.9, "b": 551.3, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 43, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 168.8, "r_y0": 551.3, "r_x1": 172.9, "r_y1": 551.3, "r_x2": 172.9, "r_y2": 548.9, "r_x3": 168.8, "r_y3": 548.9, "coord_origin": "TOPLEFT" }, "text": "unit", "orig": "unit", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 24, "label": "text", "bbox": { "l": 168.8, "t": 553.2, "r": 172.9, "b": 555.5, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 44, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 168.8, "r_y0": 555.5, "r_x1": 172.9, "r_y1": 555.5, "r_x2": 172.9, "r_y2": 553.2, "r_x3": 168.8, "r_y3": 553.2, "coord_origin": "TOPLEFT" }, "text": "unit", "orig": "unit", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 25, "label": "text", "bbox": { "l": 147.3, "t": 544.7, "r": 149.7, "b": 547.0, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 45, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 147.3, "r_y0": 547.0, "r_x1": 149.7, "r_y1": 547.0, "r_x2": 149.7, "r_y2": 544.7, "r_x3": 147.3, "r_y3": 544.7, "coord_origin": "TOPLEFT" }, "text": "2.", "orig": "2.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 26, "label": "text", "bbox": { "l": 150.9, "t": 544.7, "r": 155.7, "b": 547.0, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 46, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 150.9, "r_y0": 547.0, "r_x1": 155.7, "r_y1": 547.0, "r_x2": 155.7, "r_y2": 544.7, "r_x3": 150.9, "r_y3": 544.7, "coord_origin": "TOPLEFT" }, "text": "Item", "orig": "Item", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 27, "label": "text", "bbox": { "l": 147.3, "t": 548.9, "r": 149.7, "b": 551.3, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 47, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 147.3, "r_y0": 551.3, "r_x1": 149.7, "r_y1": 551.3, "r_x2": 149.7, "r_y2": 548.9, "r_x3": 147.3, "r_y3": 548.9, "coord_origin": "TOPLEFT" }, "text": "3.", "orig": "3.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 28, "label": "text", "bbox": { "l": 150.9, "t": 548.9, "r": 155.7, "b": 551.3, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 48, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 150.9, "r_y0": 551.3, "r_x1": 155.7, "r_y1": 551.3, "r_x2": 155.7, "r_y2": 548.9, "r_x3": 150.9, "r_y3": 548.9, "coord_origin": "TOPLEFT" }, "text": "Item", "orig": "Item", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 29, "label": "text", "bbox": { "l": 147.3, "t": 553.2, "r": 149.7, "b": 555.5, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 49, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 147.3, "r_y0": 555.5, "r_x1": 149.7, "r_y1": 555.5, "r_x2": 149.7, "r_y2": 553.2, "r_x3": 147.3, "r_y3": 553.2, "coord_origin": "TOPLEFT" }, "text": "4.", "orig": "4.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 30, "label": "text", "bbox": { "l": 150.9, "t": 553.2, "r": 155.7, "b": 555.5, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 50, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 150.9, "r_y0": 555.5, "r_x1": 155.7, "r_y1": 555.5, "r_x2": 155.7, "r_y2": 553.2, "r_x3": 150.9, "r_y3": 553.2, "coord_origin": "TOPLEFT" }, "text": "Item", "orig": "Item", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 31, "label": "text", "bbox": { "l": 152.1, "t": 517.0, "r": 171.2, "b": 521.3, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 51, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 152.1, "r_y0": 521.3, "r_x1": 171.2, "r_y1": 521.3, "r_x2": 171.2, "r_y2": 517.0, "r_x3": 152.1, "r_y3": 517.0, "coord_origin": "TOPLEFT" }, "text": "Extracted", "orig": "Extracted", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 32, "label": "text", "bbox": { "l": 148.1, "t": 522.3, "r": 175.2, "b": 526.6, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 52, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 148.1, "r_y0": 526.6, "r_x1": 175.2, "r_y1": 526.6, "r_x2": 175.2, "r_y2": 522.3, "r_x3": 148.1, "r_y3": 522.3, "coord_origin": "TOPLEFT" }, "text": "Table Images", "orig": "Table Images", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 33, "label": "text", "bbox": { "l": 193.5, "t": 524.5, "r": 220.3, "b": 528.8, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 53, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 193.5, "r_y0": 528.8, "r_x1": 220.3, "r_y1": 528.8, "r_x2": 220.3, "r_y2": 524.5, "r_x3": 193.5, "r_y3": 524.5, "coord_origin": "TOPLEFT" }, "text": "Standardized", "orig": "Standardized", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 34, "label": "text", "bbox": { "l": 199.5, "t": 529.8, "r": 214.4, "b": 534.1, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 54, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 199.5, "r_y0": 534.1, "r_x1": 214.4, "r_y1": 534.1, "r_x2": 214.4, "r_y2": 529.8, "r_x3": 199.5, "r_y3": 529.8, "coord_origin": "TOPLEFT" }, "text": "Images", "orig": "Images", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 35, "label": "text", "bbox": { "l": 273.6, "t": 509.9, "r": 284.5, "b": 514.2, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 55, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 273.6, "r_y0": 514.2, "r_x1": 284.5, "r_y1": 514.2, "r_x2": 284.5, "r_y2": 509.9, "r_x3": 273.6, "r_y3": 509.9, "coord_origin": "TOPLEFT" }, "text": "BBox", "orig": "BBox", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 36, "label": "text", "bbox": { "l": 270.5, "t": 513.7, "r": 287.6, "b": 518.0, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 56, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 270.5, "r_y0": 518.0, "r_x1": 287.6, "r_y1": 518.0, "r_x2": 287.6, "r_y2": 513.7, "r_x3": 270.5, "r_y3": 513.7, "coord_origin": "TOPLEFT" }, "text": "Decoder", "orig": "Decoder", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 37, "label": "text", "bbox": { "l": 332.5, "t": 508.1, "r": 348.1, "b": 512.4, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 57, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 332.5, "r_y0": 512.4, "r_x1": 348.1, "r_y1": 512.4, "r_x2": 348.1, "r_y2": 508.1, "r_x3": 332.5, "r_y3": 508.1, "coord_origin": "TOPLEFT" }, "text": "BBoxes", "orig": "BBoxes", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 38, "label": "text", "bbox": { "l": 376.7, "t": 521.1, "r": 407.3, "b": 525.4, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 58, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 376.7, "r_y0": 525.4, "r_x1": 407.3, "r_y1": 525.4, "r_x2": 407.3, "r_y2": 521.1, "r_x3": 376.7, "r_y3": 521.1, "coord_origin": "TOPLEFT" }, "text": "BBoxes can be", "orig": "BBoxes can be", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 39, "label": "text", "bbox": { "l": 373.9, "t": 525.7, "r": 410.0, "b": 529.9, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 59, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 373.9, "r_y0": 529.9, "r_x1": 410.0, "r_y1": 529.9, "r_x2": 410.0, "r_y2": 525.7, "r_x3": 373.9, "r_y3": 525.7, "coord_origin": "TOPLEFT" }, "text": "traced back to the", "orig": "traced back to the", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 40, "label": "text", "bbox": { "l": 375.3, "t": 530.2, "r": 408.6, "b": 534.5, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 60, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 375.3, "r_y0": 534.5, "r_x1": 408.6, "r_y1": 534.5, "r_x2": 408.6, "r_y2": 530.2, "r_x3": 375.3, "r_y3": 530.2, "coord_origin": "TOPLEFT" }, "text": "original image to", "orig": "original image to", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 41, "label": "text", "bbox": { "l": 377.1, "t": 534.8, "r": 406.9, "b": 539.0, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 61, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 377.1, "r_y0": 539.0, "r_x1": 406.9, "r_y1": 539.0, "r_x2": 406.9, "r_y2": 534.8, "r_x3": 377.1, "r_y3": 534.8, "coord_origin": "TOPLEFT" }, "text": "extract content", "orig": "extract content", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 42, "label": "text", "bbox": { "l": 383.6, "t": 563.2, "r": 433.8, "b": 567.5, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 62, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 383.6, "r_y0": 567.5, "r_x1": 433.8, "r_y1": 567.5, "r_x2": 433.8, "r_y2": 563.2, "r_x3": 383.6, "r_y3": 563.2, "coord_origin": "TOPLEFT" }, "text": "Structure Tags sequence", "orig": "Structure Tags sequence", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 43, "label": "text", "bbox": { "l": 383.5, "t": 567.8, "r": 433.8, "b": 572.0, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 63, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 383.5, "r_y0": 572.0, "r_x1": 433.8, "r_y1": 572.0, "r_x2": 433.8, "r_y2": 567.8, "r_x3": 383.5, "r_y3": 567.8, "coord_origin": "TOPLEFT" }, "text": "provide full description of", "orig": "provide full description of", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 44, "label": "text", "bbox": { "l": 390.5, "t": 572.3, "r": 426.9, "b": 576.6, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 64, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 390.5, "r_y0": 576.6, "r_x1": 426.9, "r_y1": 576.6, "r_x2": 426.9, "r_y2": 572.3, "r_x3": 390.5, "r_y3": 572.3, "coord_origin": "TOPLEFT" }, "text": "the table structure", "orig": "the table structure", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 45, "label": "text", "bbox": { "l": 293.9, "t": 577.9, "r": 323.2, "b": 582.2, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 65, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 293.9, "r_y0": 582.2, "r_x1": 323.2, "r_y1": 582.2, "r_x2": 323.2, "r_y2": 577.9, "r_x3": 293.9, "r_y3": 577.9, "coord_origin": "TOPLEFT" }, "text": "Structure Tags", "orig": "Structure Tags", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 46, "label": "text", "bbox": { "l": 293.9, "t": 582.4, "r": 324.6, "b": 586.7, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 66, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 293.9, "r_y0": 586.7, "r_x1": 324.6, "r_y1": 586.7, "r_x2": 324.6, "r_y2": 582.4, "r_x3": 293.9, "r_y3": 582.4, "coord_origin": "TOPLEFT" }, "text": "in OTSL format", "orig": "in OTSL format", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 47, "label": "text", "bbox": { "l": 333.1, "t": 541.8, "r": 364.1, "b": 546.1, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 67, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 333.1, "r_y0": 546.1, "r_x1": 364.1, "r_y1": 546.1, "r_x2": 364.1, "r_y2": 541.8, "r_x3": 333.1, "r_y3": 541.8, "coord_origin": "TOPLEFT" }, "text": "BBoxes in sync", "orig": "BBoxes in sync", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 48, "label": "text", "bbox": { "l": 333.1, "t": 545.6, "r": 369.7, "b": 549.9, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 68, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 333.1, "r_y0": 549.9, "r_x1": 369.7, "r_y1": 549.9, "r_x2": 369.7, "r_y2": 545.6, "r_x3": 333.1, "r_y3": 545.6, "coord_origin": "TOPLEFT" }, "text": "with tag sequence", "orig": "with tag sequence", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 49, "label": "text", "bbox": { "l": 232.7, "t": 515.2, "r": 249.6, "b": 519.5, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 69, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 232.7, "r_y0": 519.5, "r_x1": 249.6, "r_y1": 519.5, "r_x2": 249.6, "r_y2": 515.2, "r_x3": 232.7, "r_y3": 515.2, "coord_origin": "TOPLEFT" }, "text": "Encoder", "orig": "Encoder", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 50, "label": "text", "bbox": { "l": 269.8, "t": 546.0, "r": 288.3, "b": 550.2, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 70, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 269.8, "r_y0": 550.2, "r_x1": 288.3, "r_y1": 550.2, "r_x2": 288.3, "r_y2": 546.0, "r_x3": 269.8, "r_y3": 546.0, "coord_origin": "TOPLEFT" }, "text": "Structure", "orig": "Structure", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 51, "label": "text", "bbox": { "l": 270.5, "t": 549.8, "r": 287.6, "b": 554.0, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 71, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 270.5, "r_y0": 554.0, "r_x1": 287.6, "r_y1": 554.0, "r_x2": 287.6, "r_y2": 549.8, "r_x3": 270.5, "r_y3": 549.8, "coord_origin": "TOPLEFT" }, "text": "Decoder", "orig": "Decoder", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 52, "label": "text", "bbox": { "l": 332.2, "t": 515.9, "r": 358.1, "b": 520.2, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 72, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 332.2, "r_y0": 520.2, "r_x1": 358.1, "r_y1": 520.2, "r_x2": 358.1, "r_y2": 515.9, "r_x3": 332.2, "r_y3": 515.9, "coord_origin": "TOPLEFT" }, "text": "[x1, y2, x2, y2]", "orig": "[x1, y2, x2, y2]", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 53, "label": "text", "bbox": { "l": 332.2, "t": 522.0, "r": 361.6, "b": 526.2, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 73, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 332.2, "r_y0": 526.2, "r_x1": 361.6, "r_y1": 526.2, "r_x2": 361.6, "r_y2": 522.0, "r_x3": 332.2, "r_y3": 522.0, "coord_origin": "TOPLEFT" }, "text": "[x1', y2', x2', y2']", "orig": "[x1', y2', x2', y2']", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 54, "label": "text", "bbox": { "l": 332.2, "t": 528.0, "r": 364.8, "b": 532.3, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 74, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 332.2, "r_y0": 532.3, "r_x1": 364.8, "r_y1": 532.3, "r_x2": 364.8, "r_y2": 528.0, "r_x3": 332.2, "r_y3": 528.0, "coord_origin": "TOPLEFT" }, "text": "[x1'', y2'', x2'', y2'']", "orig": "[x1'', y2'', x2'', y2'']", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 55, "label": "text", "bbox": { "l": 332.2, "t": 534.1, "r": 336.0, "b": 538.4, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 75, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 332.2, "r_y0": 538.4, "r_x1": 336.0, "r_y1": 538.4, "r_x2": 336.0, "r_y2": 534.1, "r_x3": 332.2, "r_y3": 534.1, "coord_origin": "TOPLEFT" }, "text": "...", "orig": "...", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 56, "label": "text", "bbox": { "l": 326.9, "t": 516.4, "r": 329.4, "b": 520.7, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 76, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 326.9, "r_y0": 520.7, "r_x1": 329.4, "r_y1": 520.7, "r_x2": 329.4, "r_y2": 516.4, "r_x3": 326.9, "r_y3": 516.4, "coord_origin": "TOPLEFT" }, "text": "1", "orig": "1", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 57, "label": "text", "bbox": { "l": 327.0, "t": 522.4, "r": 329.6, "b": 526.7, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 77, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 327.0, "r_y0": 526.7, "r_x1": 329.6, "r_y1": 526.7, "r_x2": 329.6, "r_y2": 522.4, "r_x3": 327.0, "r_y3": 522.4, "coord_origin": "TOPLEFT" }, "text": "2", "orig": "2", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 58, "label": "text", "bbox": { "l": 327.0, "t": 528.5, "r": 329.6, "b": 532.8, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 78, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 327.0, "r_y0": 532.8, "r_x1": 329.6, "r_y1": 532.8, "r_x2": 329.6, "r_y2": 528.5, "r_x3": 327.0, "r_y3": 528.5, "coord_origin": "TOPLEFT" }, "text": "3", "orig": "3", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 59, "label": "text", "bbox": { "l": 424.1, "t": 527.4, "r": 426.7, "b": 531.7, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 79, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 424.1, "r_y0": 531.7, "r_x1": 426.7, "r_y1": 531.7, "r_x2": 426.7, "r_y2": 527.4, "r_x3": 424.1, "r_y3": 527.4, "coord_origin": "TOPLEFT" }, "text": "3", "orig": "3", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 60, "label": "text", "bbox": { "l": 453.0, "t": 517.5, "r": 455.5, "b": 521.7, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 80, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 453.0, "r_y0": 521.7, "r_x1": 455.5, "r_y1": 521.7, "r_x2": 455.5, "r_y2": 517.5, "r_x3": 453.0, "r_y3": 517.5, "coord_origin": "TOPLEFT" }, "text": "2", "orig": "2", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 61, "label": "text", "bbox": { "l": 423.9, "t": 517.1, "r": 426.4, "b": 521.3, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 81, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 423.9, "r_y0": 521.3, "r_x1": 426.4, "r_y1": 521.3, "r_x2": 426.4, "r_y2": 517.1, "r_x3": 423.9, "r_y3": 517.1, "coord_origin": "TOPLEFT" }, "text": "1", "orig": "1", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 62, "label": "text", "bbox": { "l": 333.4, "t": 557.4, "r": 337.3, "b": 562.4, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 82, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 333.4, "r_y0": 562.4, "r_x1": 337.3, "r_y1": 562.4, "r_x2": 337.3, "r_y2": 557.4, "r_x3": 333.4, "r_y3": 557.4, "coord_origin": "TOPLEFT" }, "text": "C", "orig": "C", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 63, "label": "text", "bbox": { "l": 340.4, "t": 557.3, "r": 344.2, "b": 562.3, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 83, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 340.4, "r_y0": 562.3, "r_x1": 344.2, "r_y1": 562.3, "r_x2": 344.2, "r_y2": 557.3, "r_x3": 340.4, "r_y3": 557.3, "coord_origin": "TOPLEFT" }, "text": "C", "orig": "C", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 64, "label": "text", "bbox": { "l": 340.3, "t": 563.9, "r": 344.2, "b": 568.9, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 84, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 340.3, "r_y0": 568.9, "r_x1": 344.2, "r_y1": 568.9, "r_x2": 344.2, "r_y2": 563.9, "r_x3": 340.3, "r_y3": 563.9, "coord_origin": "TOPLEFT" }, "text": "C", "orig": "C", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 65, "label": "text", "bbox": { "l": 346.8, "t": 563.9, "r": 350.6, "b": 568.9, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 85, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 346.8, "r_y0": 568.9, "r_x1": 350.6, "r_y1": 568.9, "r_x2": 350.6, "r_y2": 563.9, "r_x3": 346.8, "r_y3": 563.9, "coord_origin": "TOPLEFT" }, "text": "C", "orig": "C", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 66, "label": "text", "bbox": { "l": 333.6, "t": 563.8, "r": 337.4, "b": 568.8, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 86, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 333.6, "r_y0": 568.8, "r_x1": 337.4, "r_y1": 568.8, "r_x2": 337.4, "r_y2": 563.8, "r_x3": 333.6, "r_y3": 563.8, "coord_origin": "TOPLEFT" }, "text": "C", "orig": "C", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 67, "label": "text", "bbox": { "l": 340.4, "t": 570.4, "r": 344.2, "b": 575.4, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 87, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 340.4, "r_y0": 575.4, "r_x1": 344.2, "r_y1": 575.4, "r_x2": 344.2, "r_y2": 570.4, "r_x3": 340.4, "r_y3": 570.4, "coord_origin": "TOPLEFT" }, "text": "C", "orig": "C", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 68, "label": "text", "bbox": { "l": 346.9, "t": 570.4, "r": 350.7, "b": 575.4, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 88, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 346.9, "r_y0": 575.4, "r_x1": 350.7, "r_y1": 575.4, "r_x2": 350.7, "r_y2": 570.4, "r_x3": 346.9, "r_y3": 570.4, "coord_origin": "TOPLEFT" }, "text": "C", "orig": "C", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 69, "label": "text", "bbox": { "l": 333.7, "t": 570.4, "r": 337.5, "b": 575.4, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 89, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 333.7, "r_y0": 575.4, "r_x1": 337.5, "r_y1": 575.4, "r_x2": 337.5, "r_y2": 570.4, "r_x3": 333.7, "r_y3": 570.4, "coord_origin": "TOPLEFT" }, "text": "C", "orig": "C", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 70, "label": "text", "bbox": { "l": 340.4, "t": 577.0, "r": 344.2, "b": 582.0, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 90, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 340.4, "r_y0": 582.0, "r_x1": 344.2, "r_y1": 582.0, "r_x2": 344.2, "r_y2": 577.0, "r_x3": 340.4, "r_y3": 577.0, "coord_origin": "TOPLEFT" }, "text": "C", "orig": "C", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 71, "label": "text", "bbox": { "l": 346.9, "t": 577.0, "r": 350.7, "b": 582.0, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 91, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 346.9, "r_y0": 582.0, "r_x1": 350.7, "r_y1": 582.0, "r_x2": 350.7, "r_y2": 577.0, "r_x3": 346.9, "r_y3": 577.0, "coord_origin": "TOPLEFT" }, "text": "C", "orig": "C", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 72, "label": "text", "bbox": { "l": 333.7, "t": 577.0, "r": 337.5, "b": 582.0, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 92, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 333.7, "r_y0": 582.0, "r_x1": 337.5, "r_y1": 582.0, "r_x2": 337.5, "r_y2": 577.0, "r_x3": 333.7, "r_y3": 577.0, "coord_origin": "TOPLEFT" }, "text": "C", "orig": "C", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 73, "label": "text", "bbox": { "l": 340.3, "t": 583.4, "r": 344.1, "b": 588.4, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 93, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 340.3, "r_y0": 588.4, "r_x1": 344.1, "r_y1": 588.4, "r_x2": 344.1, "r_y2": 583.4, "r_x3": 340.3, "r_y3": 583.4, "coord_origin": "TOPLEFT" }, "text": "C", "orig": "C", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 74, "label": "text", "bbox": { "l": 346.8, "t": 583.4, "r": 350.6, "b": 588.4, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 94, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 346.8, "r_y0": 588.4, "r_x1": 350.6, "r_y1": 588.4, "r_x2": 350.6, "r_y2": 583.4, "r_x3": 346.8, "r_y3": 583.4, "coord_origin": "TOPLEFT" }, "text": "C", "orig": "C", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 75, "label": "text", "bbox": { "l": 333.6, "t": 583.4, "r": 337.4, "b": 588.3, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 95, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 333.6, "r_y0": 588.3, "r_x1": 337.4, "r_y1": 588.3, "r_x2": 337.4, "r_y2": 583.4, "r_x3": 333.6, "r_y3": 583.4, "coord_origin": "TOPLEFT" }, "text": "C", "orig": "C", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 76, "label": "text", "bbox": { "l": 353.0, "t": 556.9, "r": 359.8, "b": 561.9, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 96, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 353.0, "r_y0": 561.9, "r_x1": 359.8, "r_y1": 561.9, "r_x2": 359.8, "r_y2": 556.9, "r_x3": 353.0, "r_y3": 556.9, "coord_origin": "TOPLEFT" }, "text": "NL", "orig": "NL", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 77, "label": "text", "bbox": { "l": 353.2, "t": 563.6, "r": 360.0, "b": 568.6, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 97, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 353.2, "r_y0": 568.6, "r_x1": 360.0, "r_y1": 568.6, "r_x2": 360.0, "r_y2": 563.6, "r_x3": 353.2, "r_y3": 563.6, "coord_origin": "TOPLEFT" }, "text": "NL", "orig": "NL", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 78, "label": "text", "bbox": { "l": 353.2, "t": 570.2, "r": 360.0, "b": 575.2, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 98, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 353.2, "r_y0": 575.2, "r_x1": 360.0, "r_y1": 575.2, "r_x2": 360.0, "r_y2": 570.2, "r_x3": 353.2, "r_y3": 570.2, "coord_origin": "TOPLEFT" }, "text": "NL", "orig": "NL", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 79, "label": "text", "bbox": { "l": 353.2, "t": 576.8, "r": 360.0, "b": 581.8, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 99, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 353.2, "r_y0": 581.8, "r_x1": 360.0, "r_y1": 581.8, "r_x2": 360.0, "r_y2": 576.8, "r_x3": 353.2, "r_y3": 576.8, "coord_origin": "TOPLEFT" }, "text": "NL", "orig": "NL", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 80, "label": "text", "bbox": { "l": 353.3, "t": 583.4, "r": 360.1, "b": 588.4, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 100, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 353.3, "r_y0": 588.4, "r_x1": 360.1, "r_y1": 588.4, "r_x2": 360.1, "r_y2": 583.4, "r_x3": 353.3, "r_y3": 583.4, "coord_origin": "TOPLEFT" }, "text": "NL", "orig": "NL", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 81, "label": "text", "bbox": { "l": 347.4, "t": 557.1, "r": 350.3, "b": 562.1, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 101, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 347.4, "r_y0": 562.1, "r_x1": 350.3, "r_y1": 562.1, "r_x2": 350.3, "r_y2": 557.1, "r_x3": 347.4, "r_y3": 557.1, "coord_origin": "TOPLEFT" }, "text": "L", "orig": "L", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 82, "label": "text", "bbox": { "l": 331.1, "t": 564.3, "r": 333.7, "b": 568.6, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 102, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 331.1, "r_y0": 568.6, "r_x1": 333.7, "r_y1": 568.6, "r_x2": 333.7, "r_y2": 564.3, "r_x3": 331.1, "r_y3": 564.3, "coord_origin": "TOPLEFT" }, "text": "3", "orig": "3", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 83, "label": "text", "bbox": { "l": 340.8, "t": 554.6, "r": 343.3, "b": 558.9, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 103, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 340.8, "r_y0": 558.9, "r_x1": 343.3, "r_y1": 558.9, "r_x2": 343.3, "r_y2": 554.6, "r_x3": 340.8, "r_y3": 554.6, "coord_origin": "TOPLEFT" }, "text": "2", "orig": "2", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 84, "label": "text", "bbox": { "l": 331.0, "t": 554.8, "r": 333.5, "b": 559.1, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 104, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 331.0, "r_y0": 559.1, "r_x1": 333.5, "r_y1": 559.1, "r_x2": 333.5, "r_y2": 554.8, "r_x3": 331.0, "r_y3": 554.8, "coord_origin": "TOPLEFT" }, "text": "1", "orig": "1", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] } ] }, { "id": 4, "label": "text", "bbox": { "l": 134.8, "t": 620.2, "r": 480.6, "b": 664.9, "coord_origin": "TOPLEFT" }, "confidence": 0.95, "cells": [ { "index": 105, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 149.7, "r_y0": 629.0, "r_x1": 480.6, "r_y1": 629.0, "r_x2": 480.6, "r_y2": 620.2, "r_x3": 149.7, "r_y3": 620.2, "coord_origin": "TOPLEFT" }, "text": "We rely on standard metrics such as Tree Edit Distance score (TEDs) for", "orig": "We rely on standard metrics such as Tree Edit Distance score (TEDs) for", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 106, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 134.8, "r_y0": 640.9, "r_x1": 480.6, "r_y1": 640.9, "r_x2": 480.6, "r_y2": 632.1, "r_x3": 134.8, "r_y3": 632.1, "coord_origin": "TOPLEFT" }, "text": "table structure prediction, and Mean Average Precision (mAP) with 0.75 Inter-", "orig": "table structure prediction, and Mean Average Precision (mAP) with 0.75 Inter-", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 107, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 134.8, "r_y0": 652.9, "r_x1": 480.6, "r_y1": 652.9, "r_x2": 480.6, "r_y2": 644.1, "r_x3": 134.8, "r_y3": 644.1, "coord_origin": "TOPLEFT" }, "text": "section Over Union (IOU) threshold for the bounding-box predictions of table", "orig": "section Over Union (IOU) threshold for the bounding-box predictions of table", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 108, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 134.8, "r_y0": 664.9, "r_x1": 480.6, "r_y1": 664.9, "r_x2": 480.6, "r_y2": 656.1, "r_x3": 134.8, "r_y3": 656.1, "coord_origin": "TOPLEFT" }, "text": "cells. The predicted OTSL structures were converted back to HTML format in", "orig": "cells. The predicted OTSL structures were converted back to HTML format in", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] } ] }, "tablestructure": { "table_map": {} }, "figures_classification": null, "equations_prediction": null, "vlm_response": null }, "assembled": { "elements": [ { "label": "page_header", "id": 9, "page_no": 7, "cluster": { "id": 9, "label": "page_header", "bbox": { "l": 134.8, "t": 93.8, "r": 139.4, "b": 101.8, "coord_origin": "TOPLEFT" }, "confidence": 0.83, "cells": [ { "index": 0, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 134.8, "r_y0": 101.8, "r_x1": 139.4, "r_y1": 101.8, "r_x2": 139.4, "r_y2": 93.8, "r_x3": 134.8, "r_y3": 93.8, "coord_origin": "TOPLEFT" }, "text": "8", "orig": "8", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, "text": "8" }, { "label": "page_header", "id": 8, "page_no": 7, "cluster": { "id": 8, "label": "page_header", "bbox": { "l": 167.8, "t": 93.8, "r": 231.7, "b": 101.8, "coord_origin": "TOPLEFT" }, "confidence": 0.86, "cells": [ { "index": 1, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 167.8, "r_y0": 101.8, "r_x1": 178.1, "r_y1": 101.8, "r_x2": 178.1, "r_y2": 93.8, "r_x3": 167.8, "r_y3": 93.8, "coord_origin": "TOPLEFT" }, "text": "M.", "orig": "M.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 2, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 182.4, "r_y0": 101.8, "r_x1": 231.7, "r_y1": 101.8, "r_x2": 231.7, "r_y2": 93.8, "r_x3": 182.4, "r_y3": 93.8, "coord_origin": "TOPLEFT" }, "text": "Lysak, et al.", "orig": "Lysak, et al.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, "text": "M. Lysak, et al." }, { "label": "text", "id": 5, "page_no": 7, "cluster": { "id": 5, "label": "text", "bbox": { "l": 134.8, "t": 118.9, "r": 480.6, "b": 139.7, "coord_origin": "TOPLEFT" }, "confidence": 0.95, "cells": [ { "index": 3, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 134.8, "r_y0": 127.7, "r_x1": 480.6, "r_y1": 127.7, "r_x2": 480.6, "r_y2": 118.9, "r_x3": 134.8, "r_y3": 118.9, "coord_origin": "TOPLEFT" }, "text": "reduces significantly the column drift seen in the HTML based models (see Fig-", "orig": "reduces significantly the column drift seen in the HTML based models (see Fig-", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 4, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 134.8, "r_y0": 139.7, "r_x1": 163.6, "r_y1": 139.7, "r_x2": 163.6, "r_y2": 130.9, "r_x3": 134.8, "r_y3": 130.9, "coord_origin": "TOPLEFT" }, "text": "ure 5).", "orig": "ure 5).", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, "text": "reduces significantly the column drift seen in the HTML based models (see Figure 5)." }, { "label": "section_header", "id": 2, "page_no": 7, "cluster": { "id": 2, "label": "section_header", "bbox": { "l": 134.8, "t": 161.6, "r": 319.3, "b": 170.4, "coord_origin": "TOPLEFT" }, "confidence": 0.95, "cells": [ { "index": 5, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 134.8, "r_y0": 170.4, "r_x1": 149.4, "r_y1": 170.4, "r_x2": 149.4, "r_y2": 161.6, "r_x3": 134.8, "r_y3": 161.6, "coord_origin": "TOPLEFT" }, "text": "4.3", "orig": "4.3", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 6, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 160.9, "r_y0": 170.4, "r_x1": 319.3, "r_y1": 170.4, "r_x2": 319.3, "r_y2": 161.6, "r_x3": 160.9, "r_y3": 161.6, "coord_origin": "TOPLEFT" }, "text": "Error-detection and -mitigation", "orig": "Error-detection and -mitigation", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, "text": "4.3 Error-detection and -mitigation" }, { "label": "text", "id": 0, "page_no": 7, "cluster": { "id": 0, "label": "text", "bbox": { "l": 134.8, "t": 182.3, "r": 480.6, "b": 298.7, "coord_origin": "TOPLEFT" }, "confidence": 0.99, "cells": [ { "index": 7, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 134.8, "r_y0": 191.1, "r_x1": 480.6, "r_y1": 191.1, "r_x2": 480.6, "r_y2": 182.3, "r_x3": 134.8, "r_y3": 182.3, "coord_origin": "TOPLEFT" }, "text": "The design of OTSL allows to validate a table structure easily on an unfinished", "orig": "The design of OTSL allows to validate a table structure easily on an unfinished", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 8, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 134.8, "r_y0": 203.0, "r_x1": 480.6, "r_y1": 203.0, "r_x2": 480.6, "r_y2": 194.2, "r_x3": 134.8, "r_y3": 194.2, "coord_origin": "TOPLEFT" }, "text": "sequence. The detection of an invalid sequence token is a clear indication of a", "orig": "sequence. The detection of an invalid sequence token is a clear indication of a", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 9, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 134.8, "r_y0": 215.0, "r_x1": 480.6, "r_y1": 215.0, "r_x2": 480.6, "r_y2": 206.2, "r_x3": 134.8, "r_y3": 206.2, "coord_origin": "TOPLEFT" }, "text": "prediction mistake, however a valid sequence by itself does not guarantee pre-", "orig": "prediction mistake, however a valid sequence by itself does not guarantee pre-", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 10, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 134.8, "r_y0": 226.9, "r_x1": 480.6, "r_y1": 226.9, "r_x2": 480.6, "r_y2": 218.1, "r_x3": 134.8, "r_y3": 218.1, "coord_origin": "TOPLEFT" }, "text": "diction correctness. Different heuristics can be used to correct token errors in", "orig": "diction correctness. Different heuristics can be used to correct token errors in", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 11, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 134.8, "r_y0": 238.9, "r_x1": 480.6, "r_y1": 238.9, "r_x2": 480.6, "r_y2": 230.1, "r_x3": 134.8, "r_y3": 230.1, "coord_origin": "TOPLEFT" }, "text": "an invalid sequence and thus increase the chances for accurate predictions. Such", "orig": "an invalid sequence and thus increase the chances for accurate predictions. Such", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 12, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 134.8, "r_y0": 250.9, "r_x1": 480.6, "r_y1": 250.9, "r_x2": 480.6, "r_y2": 242.1, "r_x3": 134.8, "r_y3": 242.1, "coord_origin": "TOPLEFT" }, "text": "heuristics can be applied either after the prediction of each token, or at the end", "orig": "heuristics can be applied either after the prediction of each token, or at the end", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 13, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 134.8, "r_y0": 262.8, "r_x1": 480.6, "r_y1": 262.8, "r_x2": 480.6, "r_y2": 254.0, "r_x3": 134.8, "r_y3": 254.0, "coord_origin": "TOPLEFT" }, "text": "on the entire predicted sequence. For example a simple heuristic which can cor-", "orig": "on the entire predicted sequence. For example a simple heuristic which can cor-", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 14, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 134.8, "r_y0": 274.8, "r_x1": 480.6, "r_y1": 274.8, "r_x2": 480.6, "r_y2": 266.0, "r_x3": 134.8, "r_y3": 266.0, "coord_origin": "TOPLEFT" }, "text": "rect the predicted OTSL sequence on-the-fly is to verify if the token with the", "orig": "rect the predicted OTSL sequence on-the-fly is to verify if the token with the", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 15, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 134.8, "r_y0": 286.7, "r_x1": 480.6, "r_y1": 286.7, "r_x2": 480.6, "r_y2": 277.9, "r_x3": 134.8, "r_y3": 277.9, "coord_origin": "TOPLEFT" }, "text": "highest prediction confidence invalidates the predicted sequence, and replace it", "orig": "highest prediction confidence invalidates the predicted sequence, and replace it", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 16, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 134.8, "r_y0": 298.7, "r_x1": 469.4, "r_y1": 298.7, "r_x2": 469.4, "r_y2": 289.9, "r_x3": 134.8, "r_y3": 289.9, "coord_origin": "TOPLEFT" }, "text": "by the token with the next highest confidence until OTSL rules are satisfied.", "orig": "by the token with the next highest confidence until OTSL rules are satisfied.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, "text": "The design of OTSL allows to validate a table structure easily on an unfinished sequence. The detection of an invalid sequence token is a clear indication of a prediction mistake, however a valid sequence by itself does not guarantee prediction correctness. Different heuristics can be used to correct token errors in an invalid sequence and thus increase the chances for accurate predictions. Such heuristics can be applied either after the prediction of each token, or at the end on the entire predicted sequence. For example a simple heuristic which can correct the predicted OTSL sequence on-the-fly is to verify if the token with the highest prediction confidence invalidates the predicted sequence, and replace it by the token with the next highest confidence until OTSL rules are satisfied." }, { "label": "section_header", "id": 3, "page_no": 7, "cluster": { "id": 3, "label": "section_header", "bbox": { "l": 134.8, "t": 321.2, "r": 229.0, "b": 331.7, "coord_origin": "TOPLEFT" }, "confidence": 0.95, "cells": [ { "index": 17, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 134.8, "r_y0": 331.7, "r_x1": 141.5, "r_y1": 331.7, "r_x2": 141.5, "r_y2": 321.2, "r_x3": 134.8, "r_y3": 321.2, "coord_origin": "TOPLEFT" }, "text": "5", "orig": "5", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 18, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 154.9, "r_y0": 331.7, "r_x1": 229.0, "r_y1": 331.7, "r_x2": 229.0, "r_y2": 321.2, "r_x3": 154.9, "r_y3": 321.2, "coord_origin": "TOPLEFT" }, "text": "Experiments", "orig": "Experiments", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, "text": "5 Experiments" }, { "label": "text", "id": 1, "page_no": 7, "cluster": { "id": 1, "label": "text", "bbox": { "l": 134.8, "t": 347.2, "r": 480.6, "b": 451.7, "coord_origin": "TOPLEFT" }, "confidence": 0.99, "cells": [ { "index": 19, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 134.8, "r_y0": 356.0, "r_x1": 480.6, "r_y1": 356.0, "r_x2": 480.6, "r_y2": 347.2, "r_x3": 134.8, "r_y3": 347.2, "coord_origin": "TOPLEFT" }, "text": "To evaluate the impact of OTSL on prediction accuracy and inference times, we", "orig": "To evaluate the impact of OTSL on prediction accuracy and inference times, we", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 20, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 134.8, "r_y0": 368.0, "r_x1": 480.6, "r_y1": 368.0, "r_x2": 480.6, "r_y2": 359.2, "r_x3": 134.8, "r_y3": 359.2, "coord_origin": "TOPLEFT" }, "text": "conducted a series of experiments based on the TableFormer model (Figure 4)", "orig": "conducted a series of experiments based on the TableFormer model (Figure 4)", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 21, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 134.8, "r_y0": 380.0, "r_x1": 480.6, "r_y1": 380.0, "r_x2": 480.6, "r_y2": 371.2, "r_x3": 134.8, "r_y3": 371.2, "coord_origin": "TOPLEFT" }, "text": "with two objectives: Firstly we evaluate the prediction quality and performance", "orig": "with two objectives: Firstly we evaluate the prediction quality and performance", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 22, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 134.8, "r_y0": 391.9, "r_x1": 480.6, "r_y1": 391.9, "r_x2": 480.6, "r_y2": 383.1, "r_x3": 134.8, "r_y3": 383.1, "coord_origin": "TOPLEFT" }, "text": "of OTSL vs. HTML after performing Hyper Parameter Optimization (HPO) on", "orig": "of OTSL vs. HTML after performing Hyper Parameter Optimization (HPO) on", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 23, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 134.8, "r_y0": 403.9, "r_x1": 148.6, "r_y1": 403.9, "r_x2": 148.6, "r_y2": 395.1, "r_x3": 134.8, "r_y3": 395.1, "coord_origin": "TOPLEFT" }, "text": "the", "orig": "the", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 24, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 151.6, "r_y0": 403.9, "r_x1": 191.8, "r_y1": 403.9, "r_x2": 191.8, "r_y2": 395.1, "r_x3": 151.6, "r_y3": 395.1, "coord_origin": "TOPLEFT" }, "text": "canonical", "orig": "canonical", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 25, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 195.9, "r_y0": 403.9, "r_x1": 480.6, "r_y1": 403.9, "r_x2": 480.6, "r_y2": 395.1, "r_x3": 195.9, "r_y3": 395.1, "coord_origin": "TOPLEFT" }, "text": "PubTabNet data set. Secondly we pick the best hyper-parameters", "orig": "PubTabNet data set. Secondly we pick the best hyper-parameters", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 26, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 134.8, "r_y0": 415.8, "r_x1": 480.6, "r_y1": 415.8, "r_x2": 480.6, "r_y2": 407.0, "r_x3": 134.8, "r_y3": 407.0, "coord_origin": "TOPLEFT" }, "text": "found in the first step and evaluate how OTSL impacts the performance of", "orig": "found in the first step and evaluate how OTSL impacts the performance of", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 27, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 134.8, "r_y0": 427.8, "r_x1": 480.6, "r_y1": 427.8, "r_x2": 480.6, "r_y2": 419.0, "r_x3": 134.8, "r_y3": 419.0, "coord_origin": "TOPLEFT" }, "text": "TableFormer after training on other publicly available data sets (FinTabNet,", "orig": "TableFormer after training on other publicly available data sets (FinTabNet,", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 28, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 134.8, "r_y0": 439.7, "r_x1": 480.6, "r_y1": 439.7, "r_x2": 480.6, "r_y2": 430.9, "r_x3": 134.8, "r_y3": 430.9, "coord_origin": "TOPLEFT" }, "text": "PubTables-1M [14]). The ground truth (GT) from all data sets has been con-", "orig": "PubTables-1M [14]). The ground truth (GT) from all data sets has been con-", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 29, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 134.8, "r_y0": 451.7, "r_x1": 479.3, "r_y1": 451.7, "r_x2": 479.3, "r_y2": 442.9, "r_x3": 134.8, "r_y3": 442.9, "coord_origin": "TOPLEFT" }, "text": "verted into OTSL format for this purpose, and will be made publicly available.", "orig": "verted into OTSL format for this purpose, and will be made publicly available.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, "text": "To evaluate the impact of OTSL on prediction accuracy and inference times, we conducted a series of experiments based on the TableFormer model (Figure 4) with two objectives: Firstly we evaluate the prediction quality and performance of OTSL vs. HTML after performing Hyper Parameter Optimization (HPO) on the canonical PubTabNet data set. Secondly we pick the best hyper-parameters found in the first step and evaluate how OTSL impacts the performance of TableFormer after training on other publicly available data sets (FinTabNet, PubTables-1M [14]). The ground truth (GT) from all data sets has been converted into OTSL format for this purpose, and will be made publicly available." }, { "label": "caption", "id": 7, "page_no": 7, "cluster": { "id": 7, "label": "caption", "bbox": { "l": 134.8, "t": 484.6, "r": 480.6, "b": 503.7, "coord_origin": "TOPLEFT" }, "confidence": 0.93, "cells": [ { "index": 30, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 134.8, "r_y0": 492.6, "r_x1": 162.6, "r_y1": 492.6, "r_x2": 162.6, "r_y2": 484.6, "r_x3": 134.8, "r_y3": 484.6, "coord_origin": "TOPLEFT" }, "text": "Fig. 4.", "orig": "Fig. 4.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 31, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 165.2, "r_y0": 492.8, "r_x1": 480.6, "r_y1": 492.8, "r_x2": 480.6, "r_y2": 484.7, "r_x3": 165.2, "r_y3": 484.7, "coord_origin": "TOPLEFT" }, "text": "Architecture sketch of the TableFormer model, which is a representative for the", "orig": "Architecture sketch of the TableFormer model, which is a representative for the", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 32, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 134.8, "r_y0": 503.7, "r_x1": 206.7, "r_y1": 503.7, "r_x2": 206.7, "r_y2": 495.7, "r_x3": 134.8, "r_y3": 495.7, "coord_origin": "TOPLEFT" }, "text": "Im2Seq approach.", "orig": "Im2Seq approach.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, "text": "Fig. 4. Architecture sketch of the TableFormer model, which is a representative for the Im2Seq approach." }, { "label": "picture", "id": 6, "page_no": 7, "cluster": { "id": 6, "label": "picture", "bbox": { "l": 140.7, "t": 508.1, "r": 472.7, "b": 593.7, "coord_origin": "TOPLEFT" }, "confidence": 0.93, "cells": [ { "index": 33, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 147.3, "r_y0": 543.1, "r_x1": 149.7, "r_y1": 543.1, "r_x2": 149.7, "r_y2": 540.7, "r_x3": 147.3, "r_y3": 540.7, "coord_origin": "TOPLEFT" }, "text": "1.", "orig": "1.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 34, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 150.9, "r_y0": 543.1, "r_x1": 155.7, "r_y1": 543.1, "r_x2": 155.7, "r_y2": 540.7, "r_x3": 150.9, "r_y3": 540.7, "coord_origin": "TOPLEFT" }, "text": "Item", "orig": "Item", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 35, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 162.8, "r_y0": 537.8, "r_x1": 172.3, "r_y1": 537.8, "r_x2": 172.3, "r_y2": 535.4, "r_x3": 162.8, "r_y3": 535.4, "coord_origin": "TOPLEFT" }, "text": "Amount", "orig": "Amount", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 36, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 147.6, "r_y0": 537.7, "r_x1": 155.9, "r_y1": 537.7, "r_x2": 155.9, "r_y2": 535.4, "r_x3": 147.6, "r_y3": 535.4, "coord_origin": "TOPLEFT" }, "text": "Names", "orig": "Names", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 37, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 158.5, "r_y0": 543.1, "r_x1": 164.1, "r_y1": 543.1, "r_x2": 164.1, "r_y2": 540.7, "r_x3": 158.5, "r_y3": 540.7, "coord_origin": "TOPLEFT" }, "text": "1000", "orig": "1000", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 38, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 158.5, "r_y0": 547.0, "r_x1": 162.7, "r_y1": 547.0, "r_x2": 162.7, "r_y2": 544.7, "r_x3": 158.5, "r_y3": 544.7, "coord_origin": "TOPLEFT" }, "text": "500", "orig": "500", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 39, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 158.5, "r_y0": 551.3, "r_x1": 164.1, "r_y1": 551.3, "r_x2": 164.1, "r_y2": 548.9, "r_x3": 158.5, "r_y3": 548.9, "coord_origin": "TOPLEFT" }, "text": "3500", "orig": "3500", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 40, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 158.5, "r_y0": 555.5, "r_x1": 162.7, "r_y1": 555.5, "r_x2": 162.7, "r_y2": 553.2, "r_x3": 158.5, "r_y3": 553.2, "coord_origin": "TOPLEFT" }, "text": "150", "orig": "150", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 41, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 168.8, "r_y0": 543.1, "r_x1": 172.9, "r_y1": 543.1, "r_x2": 172.9, "r_y2": 540.7, "r_x3": 168.8, "r_y3": 540.7, "coord_origin": "TOPLEFT" }, "text": "unit", "orig": "unit", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 42, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 168.8, "r_y0": 547.0, "r_x1": 172.9, "r_y1": 547.0, "r_x2": 172.9, "r_y2": 544.7, "r_x3": 168.8, "r_y3": 544.7, "coord_origin": "TOPLEFT" }, "text": "unit", "orig": "unit", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 43, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 168.8, "r_y0": 551.3, "r_x1": 172.9, "r_y1": 551.3, "r_x2": 172.9, "r_y2": 548.9, "r_x3": 168.8, "r_y3": 548.9, "coord_origin": "TOPLEFT" }, "text": "unit", "orig": "unit", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 44, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 168.8, "r_y0": 555.5, "r_x1": 172.9, "r_y1": 555.5, "r_x2": 172.9, "r_y2": 553.2, "r_x3": 168.8, "r_y3": 553.2, "coord_origin": "TOPLEFT" }, "text": "unit", "orig": "unit", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 45, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 147.3, "r_y0": 547.0, "r_x1": 149.7, "r_y1": 547.0, "r_x2": 149.7, "r_y2": 544.7, "r_x3": 147.3, "r_y3": 544.7, "coord_origin": "TOPLEFT" }, "text": "2.", "orig": "2.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 46, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 150.9, "r_y0": 547.0, "r_x1": 155.7, "r_y1": 547.0, "r_x2": 155.7, "r_y2": 544.7, "r_x3": 150.9, "r_y3": 544.7, "coord_origin": "TOPLEFT" }, "text": "Item", "orig": "Item", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 47, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 147.3, "r_y0": 551.3, "r_x1": 149.7, "r_y1": 551.3, "r_x2": 149.7, "r_y2": 548.9, "r_x3": 147.3, "r_y3": 548.9, "coord_origin": "TOPLEFT" }, "text": "3.", "orig": "3.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 48, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 150.9, "r_y0": 551.3, "r_x1": 155.7, "r_y1": 551.3, "r_x2": 155.7, "r_y2": 548.9, "r_x3": 150.9, "r_y3": 548.9, "coord_origin": "TOPLEFT" }, "text": "Item", "orig": "Item", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 49, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 147.3, "r_y0": 555.5, "r_x1": 149.7, "r_y1": 555.5, "r_x2": 149.7, "r_y2": 553.2, "r_x3": 147.3, "r_y3": 553.2, "coord_origin": "TOPLEFT" }, "text": "4.", "orig": "4.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 50, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 150.9, "r_y0": 555.5, "r_x1": 155.7, "r_y1": 555.5, "r_x2": 155.7, "r_y2": 553.2, "r_x3": 150.9, "r_y3": 553.2, "coord_origin": "TOPLEFT" }, "text": "Item", "orig": "Item", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 51, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 152.1, "r_y0": 521.3, "r_x1": 171.2, "r_y1": 521.3, "r_x2": 171.2, "r_y2": 517.0, "r_x3": 152.1, "r_y3": 517.0, "coord_origin": "TOPLEFT" }, "text": "Extracted", "orig": "Extracted", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 52, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 148.1, "r_y0": 526.6, "r_x1": 175.2, "r_y1": 526.6, "r_x2": 175.2, "r_y2": 522.3, "r_x3": 148.1, "r_y3": 522.3, "coord_origin": "TOPLEFT" }, "text": "Table Images", "orig": "Table Images", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 53, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 193.5, "r_y0": 528.8, "r_x1": 220.3, "r_y1": 528.8, "r_x2": 220.3, "r_y2": 524.5, "r_x3": 193.5, "r_y3": 524.5, "coord_origin": "TOPLEFT" }, "text": "Standardized", "orig": "Standardized", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 54, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 199.5, "r_y0": 534.1, "r_x1": 214.4, "r_y1": 534.1, "r_x2": 214.4, "r_y2": 529.8, "r_x3": 199.5, "r_y3": 529.8, "coord_origin": "TOPLEFT" }, "text": "Images", "orig": "Images", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 55, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 273.6, "r_y0": 514.2, "r_x1": 284.5, "r_y1": 514.2, "r_x2": 284.5, "r_y2": 509.9, "r_x3": 273.6, "r_y3": 509.9, "coord_origin": "TOPLEFT" }, "text": "BBox", "orig": "BBox", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 56, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 270.5, "r_y0": 518.0, "r_x1": 287.6, "r_y1": 518.0, "r_x2": 287.6, "r_y2": 513.7, "r_x3": 270.5, "r_y3": 513.7, "coord_origin": "TOPLEFT" }, "text": "Decoder", "orig": "Decoder", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 57, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 332.5, "r_y0": 512.4, "r_x1": 348.1, "r_y1": 512.4, "r_x2": 348.1, "r_y2": 508.1, "r_x3": 332.5, "r_y3": 508.1, "coord_origin": "TOPLEFT" }, "text": "BBoxes", "orig": "BBoxes", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 58, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 376.7, "r_y0": 525.4, "r_x1": 407.3, "r_y1": 525.4, "r_x2": 407.3, "r_y2": 521.1, "r_x3": 376.7, "r_y3": 521.1, "coord_origin": "TOPLEFT" }, "text": "BBoxes can be", "orig": "BBoxes can be", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 59, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 373.9, "r_y0": 529.9, "r_x1": 410.0, "r_y1": 529.9, "r_x2": 410.0, "r_y2": 525.7, "r_x3": 373.9, "r_y3": 525.7, "coord_origin": "TOPLEFT" }, "text": "traced back to the", "orig": "traced back to the", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 60, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 375.3, "r_y0": 534.5, "r_x1": 408.6, "r_y1": 534.5, "r_x2": 408.6, "r_y2": 530.2, "r_x3": 375.3, "r_y3": 530.2, "coord_origin": "TOPLEFT" }, "text": "original image to", "orig": "original image to", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 61, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 377.1, "r_y0": 539.0, "r_x1": 406.9, "r_y1": 539.0, "r_x2": 406.9, "r_y2": 534.8, "r_x3": 377.1, "r_y3": 534.8, "coord_origin": "TOPLEFT" }, "text": "extract content", "orig": "extract content", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 62, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 383.6, "r_y0": 567.5, "r_x1": 433.8, "r_y1": 567.5, "r_x2": 433.8, "r_y2": 563.2, "r_x3": 383.6, "r_y3": 563.2, "coord_origin": "TOPLEFT" }, "text": "Structure Tags sequence", "orig": "Structure Tags sequence", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 63, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 383.5, "r_y0": 572.0, "r_x1": 433.8, "r_y1": 572.0, "r_x2": 433.8, "r_y2": 567.8, "r_x3": 383.5, "r_y3": 567.8, "coord_origin": "TOPLEFT" }, "text": "provide full description of", "orig": "provide full description of", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 64, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 390.5, "r_y0": 576.6, "r_x1": 426.9, "r_y1": 576.6, "r_x2": 426.9, "r_y2": 572.3, "r_x3": 390.5, "r_y3": 572.3, "coord_origin": "TOPLEFT" }, "text": "the table structure", "orig": "the table structure", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 65, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 293.9, "r_y0": 582.2, "r_x1": 323.2, "r_y1": 582.2, "r_x2": 323.2, "r_y2": 577.9, "r_x3": 293.9, "r_y3": 577.9, "coord_origin": "TOPLEFT" }, "text": "Structure Tags", "orig": "Structure Tags", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 66, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 293.9, "r_y0": 586.7, "r_x1": 324.6, "r_y1": 586.7, "r_x2": 324.6, "r_y2": 582.4, "r_x3": 293.9, "r_y3": 582.4, "coord_origin": "TOPLEFT" }, "text": "in OTSL format", "orig": "in OTSL format", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 67, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 333.1, "r_y0": 546.1, "r_x1": 364.1, "r_y1": 546.1, "r_x2": 364.1, "r_y2": 541.8, "r_x3": 333.1, "r_y3": 541.8, "coord_origin": "TOPLEFT" }, "text": "BBoxes in sync", "orig": "BBoxes in sync", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 68, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 333.1, "r_y0": 549.9, "r_x1": 369.7, "r_y1": 549.9, "r_x2": 369.7, "r_y2": 545.6, "r_x3": 333.1, "r_y3": 545.6, "coord_origin": "TOPLEFT" }, "text": "with tag sequence", "orig": "with tag sequence", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 69, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 232.7, "r_y0": 519.5, "r_x1": 249.6, "r_y1": 519.5, "r_x2": 249.6, "r_y2": 515.2, "r_x3": 232.7, "r_y3": 515.2, "coord_origin": "TOPLEFT" }, "text": "Encoder", "orig": "Encoder", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 70, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 269.8, "r_y0": 550.2, "r_x1": 288.3, "r_y1": 550.2, "r_x2": 288.3, "r_y2": 546.0, "r_x3": 269.8, "r_y3": 546.0, "coord_origin": "TOPLEFT" }, "text": "Structure", "orig": "Structure", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 71, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 270.5, "r_y0": 554.0, "r_x1": 287.6, "r_y1": 554.0, "r_x2": 287.6, "r_y2": 549.8, "r_x3": 270.5, "r_y3": 549.8, "coord_origin": "TOPLEFT" }, "text": "Decoder", "orig": "Decoder", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 72, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 332.2, "r_y0": 520.2, "r_x1": 358.1, "r_y1": 520.2, "r_x2": 358.1, "r_y2": 515.9, "r_x3": 332.2, "r_y3": 515.9, "coord_origin": "TOPLEFT" }, "text": "[x1, y2, x2, y2]", "orig": "[x1, y2, x2, y2]", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 73, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 332.2, "r_y0": 526.2, "r_x1": 361.6, "r_y1": 526.2, "r_x2": 361.6, "r_y2": 522.0, "r_x3": 332.2, "r_y3": 522.0, "coord_origin": "TOPLEFT" }, "text": "[x1', y2', x2', y2']", "orig": "[x1', y2', x2', y2']", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 74, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 332.2, "r_y0": 532.3, "r_x1": 364.8, "r_y1": 532.3, "r_x2": 364.8, "r_y2": 528.0, "r_x3": 332.2, "r_y3": 528.0, "coord_origin": "TOPLEFT" }, "text": "[x1'', y2'', x2'', y2'']", "orig": "[x1'', y2'', x2'', y2'']", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 75, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 332.2, "r_y0": 538.4, "r_x1": 336.0, "r_y1": 538.4, "r_x2": 336.0, "r_y2": 534.1, "r_x3": 332.2, "r_y3": 534.1, "coord_origin": "TOPLEFT" }, "text": "...", "orig": "...", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 76, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 326.9, "r_y0": 520.7, "r_x1": 329.4, "r_y1": 520.7, "r_x2": 329.4, "r_y2": 516.4, "r_x3": 326.9, "r_y3": 516.4, "coord_origin": "TOPLEFT" }, "text": "1", "orig": "1", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 77, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 327.0, "r_y0": 526.7, "r_x1": 329.6, "r_y1": 526.7, "r_x2": 329.6, "r_y2": 522.4, "r_x3": 327.0, "r_y3": 522.4, "coord_origin": "TOPLEFT" }, "text": "2", "orig": "2", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 78, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 327.0, "r_y0": 532.8, "r_x1": 329.6, "r_y1": 532.8, "r_x2": 329.6, "r_y2": 528.5, "r_x3": 327.0, "r_y3": 528.5, "coord_origin": "TOPLEFT" }, "text": "3", "orig": "3", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 79, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 424.1, "r_y0": 531.7, "r_x1": 426.7, "r_y1": 531.7, "r_x2": 426.7, "r_y2": 527.4, "r_x3": 424.1, "r_y3": 527.4, "coord_origin": "TOPLEFT" }, "text": "3", "orig": "3", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 80, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 453.0, "r_y0": 521.7, "r_x1": 455.5, "r_y1": 521.7, "r_x2": 455.5, "r_y2": 517.5, "r_x3": 453.0, "r_y3": 517.5, "coord_origin": "TOPLEFT" }, "text": "2", "orig": "2", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 81, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 423.9, "r_y0": 521.3, "r_x1": 426.4, "r_y1": 521.3, "r_x2": 426.4, "r_y2": 517.1, "r_x3": 423.9, "r_y3": 517.1, "coord_origin": "TOPLEFT" }, "text": "1", "orig": "1", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 82, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 333.4, "r_y0": 562.4, "r_x1": 337.3, "r_y1": 562.4, "r_x2": 337.3, "r_y2": 557.4, "r_x3": 333.4, "r_y3": 557.4, "coord_origin": "TOPLEFT" }, "text": "C", "orig": "C", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 83, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 340.4, "r_y0": 562.3, "r_x1": 344.2, "r_y1": 562.3, "r_x2": 344.2, "r_y2": 557.3, "r_x3": 340.4, "r_y3": 557.3, "coord_origin": "TOPLEFT" }, "text": "C", "orig": "C", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 84, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 340.3, "r_y0": 568.9, "r_x1": 344.2, "r_y1": 568.9, "r_x2": 344.2, "r_y2": 563.9, "r_x3": 340.3, "r_y3": 563.9, "coord_origin": "TOPLEFT" }, "text": "C", "orig": "C", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 85, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 346.8, "r_y0": 568.9, "r_x1": 350.6, "r_y1": 568.9, "r_x2": 350.6, "r_y2": 563.9, "r_x3": 346.8, "r_y3": 563.9, "coord_origin": "TOPLEFT" }, "text": "C", "orig": "C", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 86, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 333.6, "r_y0": 568.8, "r_x1": 337.4, "r_y1": 568.8, "r_x2": 337.4, "r_y2": 563.8, "r_x3": 333.6, "r_y3": 563.8, "coord_origin": "TOPLEFT" }, "text": "C", "orig": "C", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 87, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 340.4, "r_y0": 575.4, "r_x1": 344.2, "r_y1": 575.4, "r_x2": 344.2, "r_y2": 570.4, "r_x3": 340.4, "r_y3": 570.4, "coord_origin": "TOPLEFT" }, "text": "C", "orig": "C", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 88, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 346.9, "r_y0": 575.4, "r_x1": 350.7, "r_y1": 575.4, "r_x2": 350.7, "r_y2": 570.4, "r_x3": 346.9, "r_y3": 570.4, "coord_origin": "TOPLEFT" }, "text": "C", "orig": "C", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 89, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 333.7, "r_y0": 575.4, "r_x1": 337.5, "r_y1": 575.4, "r_x2": 337.5, "r_y2": 570.4, "r_x3": 333.7, "r_y3": 570.4, "coord_origin": "TOPLEFT" }, "text": "C", "orig": "C", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 90, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 340.4, "r_y0": 582.0, "r_x1": 344.2, "r_y1": 582.0, "r_x2": 344.2, "r_y2": 577.0, "r_x3": 340.4, "r_y3": 577.0, "coord_origin": "TOPLEFT" }, "text": "C", "orig": "C", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 91, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 346.9, "r_y0": 582.0, "r_x1": 350.7, "r_y1": 582.0, "r_x2": 350.7, "r_y2": 577.0, "r_x3": 346.9, "r_y3": 577.0, "coord_origin": "TOPLEFT" }, "text": "C", "orig": "C", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 92, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 333.7, "r_y0": 582.0, "r_x1": 337.5, "r_y1": 582.0, "r_x2": 337.5, "r_y2": 577.0, "r_x3": 333.7, "r_y3": 577.0, "coord_origin": "TOPLEFT" }, "text": "C", "orig": "C", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 93, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 340.3, "r_y0": 588.4, "r_x1": 344.1, "r_y1": 588.4, "r_x2": 344.1, "r_y2": 583.4, "r_x3": 340.3, "r_y3": 583.4, "coord_origin": "TOPLEFT" }, "text": "C", "orig": "C", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 94, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 346.8, "r_y0": 588.4, "r_x1": 350.6, "r_y1": 588.4, "r_x2": 350.6, "r_y2": 583.4, "r_x3": 346.8, "r_y3": 583.4, "coord_origin": "TOPLEFT" }, "text": "C", "orig": "C", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 95, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 333.6, "r_y0": 588.3, "r_x1": 337.4, "r_y1": 588.3, "r_x2": 337.4, "r_y2": 583.4, "r_x3": 333.6, "r_y3": 583.4, "coord_origin": "TOPLEFT" }, "text": "C", "orig": "C", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 96, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 353.0, "r_y0": 561.9, "r_x1": 359.8, "r_y1": 561.9, "r_x2": 359.8, "r_y2": 556.9, "r_x3": 353.0, "r_y3": 556.9, "coord_origin": "TOPLEFT" }, "text": "NL", "orig": "NL", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 97, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 353.2, "r_y0": 568.6, "r_x1": 360.0, "r_y1": 568.6, "r_x2": 360.0, "r_y2": 563.6, "r_x3": 353.2, "r_y3": 563.6, "coord_origin": "TOPLEFT" }, "text": "NL", "orig": "NL", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 98, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 353.2, "r_y0": 575.2, "r_x1": 360.0, "r_y1": 575.2, "r_x2": 360.0, "r_y2": 570.2, "r_x3": 353.2, "r_y3": 570.2, "coord_origin": "TOPLEFT" }, "text": "NL", "orig": "NL", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 99, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 353.2, "r_y0": 581.8, "r_x1": 360.0, "r_y1": 581.8, "r_x2": 360.0, "r_y2": 576.8, "r_x3": 353.2, "r_y3": 576.8, "coord_origin": "TOPLEFT" }, "text": "NL", "orig": "NL", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 100, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 353.3, "r_y0": 588.4, "r_x1": 360.1, "r_y1": 588.4, "r_x2": 360.1, "r_y2": 583.4, "r_x3": 353.3, "r_y3": 583.4, "coord_origin": "TOPLEFT" }, "text": "NL", "orig": "NL", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 101, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 347.4, "r_y0": 562.1, "r_x1": 350.3, "r_y1": 562.1, "r_x2": 350.3, "r_y2": 557.1, "r_x3": 347.4, "r_y3": 557.1, "coord_origin": "TOPLEFT" }, "text": "L", "orig": "L", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 102, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 331.1, "r_y0": 568.6, "r_x1": 333.7, "r_y1": 568.6, "r_x2": 333.7, "r_y2": 564.3, "r_x3": 331.1, "r_y3": 564.3, "coord_origin": "TOPLEFT" }, "text": "3", "orig": "3", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 103, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 340.8, "r_y0": 558.9, "r_x1": 343.3, "r_y1": 558.9, "r_x2": 343.3, "r_y2": 554.6, "r_x3": 340.8, "r_y3": 554.6, "coord_origin": "TOPLEFT" }, "text": "2", "orig": "2", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 104, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 331.0, "r_y0": 559.1, "r_x1": 333.5, "r_y1": 559.1, "r_x2": 333.5, "r_y2": 554.8, "r_x3": 331.0, "r_y3": 554.8, "coord_origin": "TOPLEFT" }, "text": "1", "orig": "1", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [ { "id": 13, "label": "text", "bbox": { "l": 147.3, "t": 540.7, "r": 149.7, "b": 543.1, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 33, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 147.3, "r_y0": 543.1, "r_x1": 149.7, "r_y1": 543.1, "r_x2": 149.7, "r_y2": 540.7, "r_x3": 147.3, "r_y3": 540.7, "coord_origin": "TOPLEFT" }, "text": "1.", "orig": "1.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 14, "label": "text", "bbox": { "l": 150.9, "t": 540.7, "r": 155.7, "b": 543.1, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 34, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 150.9, "r_y0": 543.1, "r_x1": 155.7, "r_y1": 543.1, "r_x2": 155.7, "r_y2": 540.7, "r_x3": 150.9, "r_y3": 540.7, "coord_origin": "TOPLEFT" }, "text": "Item", "orig": "Item", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 15, "label": "text", "bbox": { "l": 162.8, "t": 535.4, "r": 172.3, "b": 537.8, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 35, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 162.8, "r_y0": 537.8, "r_x1": 172.3, "r_y1": 537.8, "r_x2": 172.3, "r_y2": 535.4, "r_x3": 162.8, "r_y3": 535.4, "coord_origin": "TOPLEFT" }, "text": "Amount", "orig": "Amount", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 16, "label": "text", "bbox": { "l": 147.6, "t": 535.4, "r": 155.9, "b": 537.7, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 36, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 147.6, "r_y0": 537.7, "r_x1": 155.9, "r_y1": 537.7, "r_x2": 155.9, "r_y2": 535.4, "r_x3": 147.6, "r_y3": 535.4, "coord_origin": "TOPLEFT" }, "text": "Names", "orig": "Names", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 17, "label": "text", "bbox": { "l": 158.5, "t": 540.7, "r": 164.1, "b": 543.1, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 37, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 158.5, "r_y0": 543.1, "r_x1": 164.1, "r_y1": 543.1, "r_x2": 164.1, "r_y2": 540.7, "r_x3": 158.5, "r_y3": 540.7, "coord_origin": "TOPLEFT" }, "text": "1000", "orig": "1000", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 18, "label": "text", "bbox": { "l": 158.5, "t": 544.7, "r": 162.7, "b": 547.0, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 38, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 158.5, "r_y0": 547.0, "r_x1": 162.7, "r_y1": 547.0, "r_x2": 162.7, "r_y2": 544.7, "r_x3": 158.5, "r_y3": 544.7, "coord_origin": "TOPLEFT" }, "text": "500", "orig": "500", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 19, "label": "text", "bbox": { "l": 158.5, "t": 548.9, "r": 164.1, "b": 551.3, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 39, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 158.5, "r_y0": 551.3, "r_x1": 164.1, "r_y1": 551.3, "r_x2": 164.1, "r_y2": 548.9, "r_x3": 158.5, "r_y3": 548.9, "coord_origin": "TOPLEFT" }, "text": "3500", "orig": "3500", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 20, "label": "text", "bbox": { "l": 158.5, "t": 553.2, "r": 162.7, "b": 555.5, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 40, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 158.5, "r_y0": 555.5, "r_x1": 162.7, "r_y1": 555.5, "r_x2": 162.7, "r_y2": 553.2, "r_x3": 158.5, "r_y3": 553.2, "coord_origin": "TOPLEFT" }, "text": "150", "orig": "150", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 21, "label": "text", "bbox": { "l": 168.8, "t": 540.7, "r": 172.9, "b": 543.1, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 41, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 168.8, "r_y0": 543.1, "r_x1": 172.9, "r_y1": 543.1, "r_x2": 172.9, "r_y2": 540.7, "r_x3": 168.8, "r_y3": 540.7, "coord_origin": "TOPLEFT" }, "text": "unit", "orig": "unit", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 22, "label": "text", "bbox": { "l": 168.8, "t": 544.7, "r": 172.9, "b": 547.0, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 42, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 168.8, "r_y0": 547.0, "r_x1": 172.9, "r_y1": 547.0, "r_x2": 172.9, "r_y2": 544.7, "r_x3": 168.8, "r_y3": 544.7, "coord_origin": "TOPLEFT" }, "text": "unit", "orig": "unit", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 23, "label": "text", "bbox": { "l": 168.8, "t": 548.9, "r": 172.9, "b": 551.3, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 43, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 168.8, "r_y0": 551.3, "r_x1": 172.9, "r_y1": 551.3, "r_x2": 172.9, "r_y2": 548.9, "r_x3": 168.8, "r_y3": 548.9, "coord_origin": "TOPLEFT" }, "text": "unit", "orig": "unit", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 24, "label": "text", "bbox": { "l": 168.8, "t": 553.2, "r": 172.9, "b": 555.5, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 44, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 168.8, "r_y0": 555.5, "r_x1": 172.9, "r_y1": 555.5, "r_x2": 172.9, "r_y2": 553.2, "r_x3": 168.8, "r_y3": 553.2, "coord_origin": "TOPLEFT" }, "text": "unit", "orig": "unit", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 25, "label": "text", "bbox": { "l": 147.3, "t": 544.7, "r": 149.7, "b": 547.0, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 45, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 147.3, "r_y0": 547.0, "r_x1": 149.7, "r_y1": 547.0, "r_x2": 149.7, "r_y2": 544.7, "r_x3": 147.3, "r_y3": 544.7, "coord_origin": "TOPLEFT" }, "text": "2.", "orig": "2.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 26, "label": "text", "bbox": { "l": 150.9, "t": 544.7, "r": 155.7, "b": 547.0, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 46, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 150.9, "r_y0": 547.0, "r_x1": 155.7, "r_y1": 547.0, "r_x2": 155.7, "r_y2": 544.7, "r_x3": 150.9, "r_y3": 544.7, "coord_origin": "TOPLEFT" }, "text": "Item", "orig": "Item", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 27, "label": "text", "bbox": { "l": 147.3, "t": 548.9, "r": 149.7, "b": 551.3, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 47, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 147.3, "r_y0": 551.3, "r_x1": 149.7, "r_y1": 551.3, "r_x2": 149.7, "r_y2": 548.9, "r_x3": 147.3, "r_y3": 548.9, "coord_origin": "TOPLEFT" }, "text": "3.", "orig": "3.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 28, "label": "text", "bbox": { "l": 150.9, "t": 548.9, "r": 155.7, "b": 551.3, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 48, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 150.9, "r_y0": 551.3, "r_x1": 155.7, "r_y1": 551.3, "r_x2": 155.7, "r_y2": 548.9, "r_x3": 150.9, "r_y3": 548.9, "coord_origin": "TOPLEFT" }, "text": "Item", "orig": "Item", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 29, "label": "text", "bbox": { "l": 147.3, "t": 553.2, "r": 149.7, "b": 555.5, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 49, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 147.3, "r_y0": 555.5, "r_x1": 149.7, "r_y1": 555.5, "r_x2": 149.7, "r_y2": 553.2, "r_x3": 147.3, "r_y3": 553.2, "coord_origin": "TOPLEFT" }, "text": "4.", "orig": "4.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 30, "label": "text", "bbox": { "l": 150.9, "t": 553.2, "r": 155.7, "b": 555.5, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 50, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 150.9, "r_y0": 555.5, "r_x1": 155.7, "r_y1": 555.5, "r_x2": 155.7, "r_y2": 553.2, "r_x3": 150.9, "r_y3": 553.2, "coord_origin": "TOPLEFT" }, "text": "Item", "orig": "Item", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 31, "label": "text", "bbox": { "l": 152.1, "t": 517.0, "r": 171.2, "b": 521.3, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 51, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 152.1, "r_y0": 521.3, "r_x1": 171.2, "r_y1": 521.3, "r_x2": 171.2, "r_y2": 517.0, "r_x3": 152.1, "r_y3": 517.0, "coord_origin": "TOPLEFT" }, "text": "Extracted", "orig": "Extracted", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 32, "label": "text", "bbox": { "l": 148.1, "t": 522.3, "r": 175.2, "b": 526.6, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 52, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 148.1, "r_y0": 526.6, "r_x1": 175.2, "r_y1": 526.6, "r_x2": 175.2, "r_y2": 522.3, "r_x3": 148.1, "r_y3": 522.3, "coord_origin": "TOPLEFT" }, "text": "Table Images", "orig": "Table Images", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 33, "label": "text", "bbox": { "l": 193.5, "t": 524.5, "r": 220.3, "b": 528.8, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 53, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 193.5, "r_y0": 528.8, "r_x1": 220.3, "r_y1": 528.8, "r_x2": 220.3, "r_y2": 524.5, "r_x3": 193.5, "r_y3": 524.5, "coord_origin": "TOPLEFT" }, "text": "Standardized", "orig": "Standardized", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 34, "label": "text", "bbox": { "l": 199.5, "t": 529.8, "r": 214.4, "b": 534.1, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 54, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 199.5, "r_y0": 534.1, "r_x1": 214.4, "r_y1": 534.1, "r_x2": 214.4, "r_y2": 529.8, "r_x3": 199.5, "r_y3": 529.8, "coord_origin": "TOPLEFT" }, "text": "Images", "orig": "Images", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 35, "label": "text", "bbox": { "l": 273.6, "t": 509.9, "r": 284.5, "b": 514.2, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 55, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 273.6, "r_y0": 514.2, "r_x1": 284.5, "r_y1": 514.2, "r_x2": 284.5, "r_y2": 509.9, "r_x3": 273.6, "r_y3": 509.9, "coord_origin": "TOPLEFT" }, "text": "BBox", "orig": "BBox", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 36, "label": "text", "bbox": { "l": 270.5, "t": 513.7, "r": 287.6, "b": 518.0, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 56, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 270.5, "r_y0": 518.0, "r_x1": 287.6, "r_y1": 518.0, "r_x2": 287.6, "r_y2": 513.7, "r_x3": 270.5, "r_y3": 513.7, "coord_origin": "TOPLEFT" }, "text": "Decoder", "orig": "Decoder", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 37, "label": "text", "bbox": { "l": 332.5, "t": 508.1, "r": 348.1, "b": 512.4, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 57, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 332.5, "r_y0": 512.4, "r_x1": 348.1, "r_y1": 512.4, "r_x2": 348.1, "r_y2": 508.1, "r_x3": 332.5, "r_y3": 508.1, "coord_origin": "TOPLEFT" }, "text": "BBoxes", "orig": "BBoxes", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 38, "label": "text", "bbox": { "l": 376.7, "t": 521.1, "r": 407.3, "b": 525.4, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 58, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 376.7, "r_y0": 525.4, "r_x1": 407.3, "r_y1": 525.4, "r_x2": 407.3, "r_y2": 521.1, "r_x3": 376.7, "r_y3": 521.1, "coord_origin": "TOPLEFT" }, "text": "BBoxes can be", "orig": "BBoxes can be", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 39, "label": "text", "bbox": { "l": 373.9, "t": 525.7, "r": 410.0, "b": 529.9, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 59, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 373.9, "r_y0": 529.9, "r_x1": 410.0, "r_y1": 529.9, "r_x2": 410.0, "r_y2": 525.7, "r_x3": 373.9, "r_y3": 525.7, "coord_origin": "TOPLEFT" }, "text": "traced back to the", "orig": "traced back to the", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 40, "label": "text", "bbox": { "l": 375.3, "t": 530.2, "r": 408.6, "b": 534.5, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 60, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 375.3, "r_y0": 534.5, "r_x1": 408.6, "r_y1": 534.5, "r_x2": 408.6, "r_y2": 530.2, "r_x3": 375.3, "r_y3": 530.2, "coord_origin": "TOPLEFT" }, "text": "original image to", "orig": "original image to", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 41, "label": "text", "bbox": { "l": 377.1, "t": 534.8, "r": 406.9, "b": 539.0, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 61, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 377.1, "r_y0": 539.0, "r_x1": 406.9, "r_y1": 539.0, "r_x2": 406.9, "r_y2": 534.8, "r_x3": 377.1, "r_y3": 534.8, "coord_origin": "TOPLEFT" }, "text": "extract content", "orig": "extract content", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 42, "label": "text", "bbox": { "l": 383.6, "t": 563.2, "r": 433.8, "b": 567.5, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 62, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 383.6, "r_y0": 567.5, "r_x1": 433.8, "r_y1": 567.5, "r_x2": 433.8, "r_y2": 563.2, "r_x3": 383.6, "r_y3": 563.2, "coord_origin": "TOPLEFT" }, "text": "Structure Tags sequence", "orig": "Structure Tags sequence", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 43, "label": "text", "bbox": { "l": 383.5, "t": 567.8, "r": 433.8, "b": 572.0, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 63, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 383.5, "r_y0": 572.0, "r_x1": 433.8, "r_y1": 572.0, "r_x2": 433.8, "r_y2": 567.8, "r_x3": 383.5, "r_y3": 567.8, "coord_origin": "TOPLEFT" }, "text": "provide full description of", "orig": "provide full description of", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 44, "label": "text", "bbox": { "l": 390.5, "t": 572.3, "r": 426.9, "b": 576.6, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 64, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 390.5, "r_y0": 576.6, "r_x1": 426.9, "r_y1": 576.6, "r_x2": 426.9, "r_y2": 572.3, "r_x3": 390.5, "r_y3": 572.3, "coord_origin": "TOPLEFT" }, "text": "the table structure", "orig": "the table structure", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 45, "label": "text", "bbox": { "l": 293.9, "t": 577.9, "r": 323.2, "b": 582.2, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 65, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 293.9, "r_y0": 582.2, "r_x1": 323.2, "r_y1": 582.2, "r_x2": 323.2, "r_y2": 577.9, "r_x3": 293.9, "r_y3": 577.9, "coord_origin": "TOPLEFT" }, "text": "Structure Tags", "orig": "Structure Tags", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 46, "label": "text", "bbox": { "l": 293.9, "t": 582.4, "r": 324.6, "b": 586.7, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 66, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 293.9, "r_y0": 586.7, "r_x1": 324.6, "r_y1": 586.7, "r_x2": 324.6, "r_y2": 582.4, "r_x3": 293.9, "r_y3": 582.4, "coord_origin": "TOPLEFT" }, "text": "in OTSL format", "orig": "in OTSL format", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 47, "label": "text", "bbox": { "l": 333.1, "t": 541.8, "r": 364.1, "b": 546.1, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 67, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 333.1, "r_y0": 546.1, "r_x1": 364.1, "r_y1": 546.1, "r_x2": 364.1, "r_y2": 541.8, "r_x3": 333.1, "r_y3": 541.8, "coord_origin": "TOPLEFT" }, "text": "BBoxes in sync", "orig": "BBoxes in sync", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 48, "label": "text", "bbox": { "l": 333.1, "t": 545.6, "r": 369.7, "b": 549.9, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 68, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 333.1, "r_y0": 549.9, "r_x1": 369.7, "r_y1": 549.9, "r_x2": 369.7, "r_y2": 545.6, "r_x3": 333.1, "r_y3": 545.6, "coord_origin": "TOPLEFT" }, "text": "with tag sequence", "orig": "with tag sequence", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 49, "label": "text", "bbox": { "l": 232.7, "t": 515.2, "r": 249.6, "b": 519.5, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 69, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 232.7, "r_y0": 519.5, "r_x1": 249.6, "r_y1": 519.5, "r_x2": 249.6, "r_y2": 515.2, "r_x3": 232.7, "r_y3": 515.2, "coord_origin": "TOPLEFT" }, "text": "Encoder", "orig": "Encoder", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 50, "label": "text", "bbox": { "l": 269.8, "t": 546.0, "r": 288.3, "b": 550.2, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 70, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 269.8, "r_y0": 550.2, "r_x1": 288.3, "r_y1": 550.2, "r_x2": 288.3, "r_y2": 546.0, "r_x3": 269.8, "r_y3": 546.0, "coord_origin": "TOPLEFT" }, "text": "Structure", "orig": "Structure", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 51, "label": "text", "bbox": { "l": 270.5, "t": 549.8, "r": 287.6, "b": 554.0, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 71, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 270.5, "r_y0": 554.0, "r_x1": 287.6, "r_y1": 554.0, "r_x2": 287.6, "r_y2": 549.8, "r_x3": 270.5, "r_y3": 549.8, "coord_origin": "TOPLEFT" }, "text": "Decoder", "orig": "Decoder", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 52, "label": "text", "bbox": { "l": 332.2, "t": 515.9, "r": 358.1, "b": 520.2, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 72, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 332.2, "r_y0": 520.2, "r_x1": 358.1, "r_y1": 520.2, "r_x2": 358.1, "r_y2": 515.9, "r_x3": 332.2, "r_y3": 515.9, "coord_origin": "TOPLEFT" }, "text": "[x1, y2, x2, y2]", "orig": "[x1, y2, x2, y2]", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 53, "label": "text", "bbox": { "l": 332.2, "t": 522.0, "r": 361.6, "b": 526.2, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 73, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 332.2, "r_y0": 526.2, "r_x1": 361.6, "r_y1": 526.2, "r_x2": 361.6, "r_y2": 522.0, "r_x3": 332.2, "r_y3": 522.0, "coord_origin": "TOPLEFT" }, "text": "[x1', y2', x2', y2']", "orig": "[x1', y2', x2', y2']", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 54, "label": "text", "bbox": { "l": 332.2, "t": 528.0, "r": 364.8, "b": 532.3, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 74, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 332.2, "r_y0": 532.3, "r_x1": 364.8, "r_y1": 532.3, "r_x2": 364.8, "r_y2": 528.0, "r_x3": 332.2, "r_y3": 528.0, "coord_origin": "TOPLEFT" }, "text": "[x1'', y2'', x2'', y2'']", "orig": "[x1'', y2'', x2'', y2'']", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 55, "label": "text", "bbox": { "l": 332.2, "t": 534.1, "r": 336.0, "b": 538.4, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 75, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 332.2, "r_y0": 538.4, "r_x1": 336.0, "r_y1": 538.4, "r_x2": 336.0, "r_y2": 534.1, "r_x3": 332.2, "r_y3": 534.1, "coord_origin": "TOPLEFT" }, "text": "...", "orig": "...", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 56, "label": "text", "bbox": { "l": 326.9, "t": 516.4, "r": 329.4, "b": 520.7, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 76, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 326.9, "r_y0": 520.7, "r_x1": 329.4, "r_y1": 520.7, "r_x2": 329.4, "r_y2": 516.4, "r_x3": 326.9, "r_y3": 516.4, "coord_origin": "TOPLEFT" }, "text": "1", "orig": "1", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 57, "label": "text", "bbox": { "l": 327.0, "t": 522.4, "r": 329.6, "b": 526.7, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 77, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 327.0, "r_y0": 526.7, "r_x1": 329.6, "r_y1": 526.7, "r_x2": 329.6, "r_y2": 522.4, "r_x3": 327.0, "r_y3": 522.4, "coord_origin": "TOPLEFT" }, "text": "2", "orig": "2", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 58, "label": "text", "bbox": { "l": 327.0, "t": 528.5, "r": 329.6, "b": 532.8, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 78, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 327.0, "r_y0": 532.8, "r_x1": 329.6, "r_y1": 532.8, "r_x2": 329.6, "r_y2": 528.5, "r_x3": 327.0, "r_y3": 528.5, "coord_origin": "TOPLEFT" }, "text": "3", "orig": "3", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 59, "label": "text", "bbox": { "l": 424.1, "t": 527.4, "r": 426.7, "b": 531.7, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 79, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 424.1, "r_y0": 531.7, "r_x1": 426.7, "r_y1": 531.7, "r_x2": 426.7, "r_y2": 527.4, "r_x3": 424.1, "r_y3": 527.4, "coord_origin": "TOPLEFT" }, "text": "3", "orig": "3", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 60, "label": "text", "bbox": { "l": 453.0, "t": 517.5, "r": 455.5, "b": 521.7, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 80, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 453.0, "r_y0": 521.7, "r_x1": 455.5, "r_y1": 521.7, "r_x2": 455.5, "r_y2": 517.5, "r_x3": 453.0, "r_y3": 517.5, "coord_origin": "TOPLEFT" }, "text": "2", "orig": "2", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 61, "label": "text", "bbox": { "l": 423.9, "t": 517.1, "r": 426.4, "b": 521.3, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 81, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 423.9, "r_y0": 521.3, "r_x1": 426.4, "r_y1": 521.3, "r_x2": 426.4, "r_y2": 517.1, "r_x3": 423.9, "r_y3": 517.1, "coord_origin": "TOPLEFT" }, "text": "1", "orig": "1", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 62, "label": "text", "bbox": { "l": 333.4, "t": 557.4, "r": 337.3, "b": 562.4, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 82, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 333.4, "r_y0": 562.4, "r_x1": 337.3, "r_y1": 562.4, "r_x2": 337.3, "r_y2": 557.4, "r_x3": 333.4, "r_y3": 557.4, "coord_origin": "TOPLEFT" }, "text": "C", "orig": "C", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 63, "label": "text", "bbox": { "l": 340.4, "t": 557.3, "r": 344.2, "b": 562.3, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 83, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 340.4, "r_y0": 562.3, "r_x1": 344.2, "r_y1": 562.3, "r_x2": 344.2, "r_y2": 557.3, "r_x3": 340.4, "r_y3": 557.3, "coord_origin": "TOPLEFT" }, "text": "C", "orig": "C", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 64, "label": "text", "bbox": { "l": 340.3, "t": 563.9, "r": 344.2, "b": 568.9, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 84, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 340.3, "r_y0": 568.9, "r_x1": 344.2, "r_y1": 568.9, "r_x2": 344.2, "r_y2": 563.9, "r_x3": 340.3, "r_y3": 563.9, "coord_origin": "TOPLEFT" }, "text": "C", "orig": "C", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 65, "label": "text", "bbox": { "l": 346.8, "t": 563.9, "r": 350.6, "b": 568.9, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 85, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 346.8, "r_y0": 568.9, "r_x1": 350.6, "r_y1": 568.9, "r_x2": 350.6, "r_y2": 563.9, "r_x3": 346.8, "r_y3": 563.9, "coord_origin": "TOPLEFT" }, "text": "C", "orig": "C", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 66, "label": "text", "bbox": { "l": 333.6, "t": 563.8, "r": 337.4, "b": 568.8, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 86, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 333.6, "r_y0": 568.8, "r_x1": 337.4, "r_y1": 568.8, "r_x2": 337.4, "r_y2": 563.8, "r_x3": 333.6, "r_y3": 563.8, "coord_origin": "TOPLEFT" }, "text": "C", "orig": "C", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 67, "label": "text", "bbox": { "l": 340.4, "t": 570.4, "r": 344.2, "b": 575.4, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 87, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 340.4, "r_y0": 575.4, "r_x1": 344.2, "r_y1": 575.4, "r_x2": 344.2, "r_y2": 570.4, "r_x3": 340.4, "r_y3": 570.4, "coord_origin": "TOPLEFT" }, "text": "C", "orig": "C", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 68, "label": "text", "bbox": { "l": 346.9, "t": 570.4, "r": 350.7, "b": 575.4, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 88, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 346.9, "r_y0": 575.4, "r_x1": 350.7, "r_y1": 575.4, "r_x2": 350.7, "r_y2": 570.4, "r_x3": 346.9, "r_y3": 570.4, "coord_origin": "TOPLEFT" }, "text": "C", "orig": "C", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 69, "label": "text", "bbox": { "l": 333.7, "t": 570.4, "r": 337.5, "b": 575.4, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 89, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 333.7, "r_y0": 575.4, "r_x1": 337.5, "r_y1": 575.4, "r_x2": 337.5, "r_y2": 570.4, "r_x3": 333.7, "r_y3": 570.4, "coord_origin": "TOPLEFT" }, "text": "C", "orig": "C", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 70, "label": "text", "bbox": { "l": 340.4, "t": 577.0, "r": 344.2, "b": 582.0, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 90, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 340.4, "r_y0": 582.0, "r_x1": 344.2, "r_y1": 582.0, "r_x2": 344.2, "r_y2": 577.0, "r_x3": 340.4, "r_y3": 577.0, "coord_origin": "TOPLEFT" }, "text": "C", "orig": "C", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 71, "label": "text", "bbox": { "l": 346.9, "t": 577.0, "r": 350.7, "b": 582.0, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 91, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 346.9, "r_y0": 582.0, "r_x1": 350.7, "r_y1": 582.0, "r_x2": 350.7, "r_y2": 577.0, "r_x3": 346.9, "r_y3": 577.0, "coord_origin": "TOPLEFT" }, "text": "C", "orig": "C", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 72, "label": "text", "bbox": { "l": 333.7, "t": 577.0, "r": 337.5, "b": 582.0, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 92, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 333.7, "r_y0": 582.0, "r_x1": 337.5, "r_y1": 582.0, "r_x2": 337.5, "r_y2": 577.0, "r_x3": 333.7, "r_y3": 577.0, "coord_origin": "TOPLEFT" }, "text": "C", "orig": "C", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 73, "label": "text", "bbox": { "l": 340.3, "t": 583.4, "r": 344.1, "b": 588.4, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 93, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 340.3, "r_y0": 588.4, "r_x1": 344.1, "r_y1": 588.4, "r_x2": 344.1, "r_y2": 583.4, "r_x3": 340.3, "r_y3": 583.4, "coord_origin": "TOPLEFT" }, "text": "C", "orig": "C", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 74, "label": "text", "bbox": { "l": 346.8, "t": 583.4, "r": 350.6, "b": 588.4, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 94, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 346.8, "r_y0": 588.4, "r_x1": 350.6, "r_y1": 588.4, "r_x2": 350.6, "r_y2": 583.4, "r_x3": 346.8, "r_y3": 583.4, "coord_origin": "TOPLEFT" }, "text": "C", "orig": "C", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 75, "label": "text", "bbox": { "l": 333.6, "t": 583.4, "r": 337.4, "b": 588.3, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 95, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 333.6, "r_y0": 588.3, "r_x1": 337.4, "r_y1": 588.3, "r_x2": 337.4, "r_y2": 583.4, "r_x3": 333.6, "r_y3": 583.4, "coord_origin": "TOPLEFT" }, "text": "C", "orig": "C", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 76, "label": "text", "bbox": { "l": 353.0, "t": 556.9, "r": 359.8, "b": 561.9, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 96, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 353.0, "r_y0": 561.9, "r_x1": 359.8, "r_y1": 561.9, "r_x2": 359.8, "r_y2": 556.9, "r_x3": 353.0, "r_y3": 556.9, "coord_origin": "TOPLEFT" }, "text": "NL", "orig": "NL", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 77, "label": "text", "bbox": { "l": 353.2, "t": 563.6, "r": 360.0, "b": 568.6, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 97, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 353.2, "r_y0": 568.6, "r_x1": 360.0, "r_y1": 568.6, "r_x2": 360.0, "r_y2": 563.6, "r_x3": 353.2, "r_y3": 563.6, "coord_origin": "TOPLEFT" }, "text": "NL", "orig": "NL", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 78, "label": "text", "bbox": { "l": 353.2, "t": 570.2, "r": 360.0, "b": 575.2, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 98, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 353.2, "r_y0": 575.2, "r_x1": 360.0, "r_y1": 575.2, "r_x2": 360.0, "r_y2": 570.2, "r_x3": 353.2, "r_y3": 570.2, "coord_origin": "TOPLEFT" }, "text": "NL", "orig": "NL", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 79, "label": "text", "bbox": { "l": 353.2, "t": 576.8, "r": 360.0, "b": 581.8, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 99, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 353.2, "r_y0": 581.8, "r_x1": 360.0, "r_y1": 581.8, "r_x2": 360.0, "r_y2": 576.8, "r_x3": 353.2, "r_y3": 576.8, "coord_origin": "TOPLEFT" }, "text": "NL", "orig": "NL", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 80, "label": "text", "bbox": { "l": 353.3, "t": 583.4, "r": 360.1, "b": 588.4, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 100, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 353.3, "r_y0": 588.4, "r_x1": 360.1, "r_y1": 588.4, "r_x2": 360.1, "r_y2": 583.4, "r_x3": 353.3, "r_y3": 583.4, "coord_origin": "TOPLEFT" }, "text": "NL", "orig": "NL", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 81, "label": "text", "bbox": { "l": 347.4, "t": 557.1, "r": 350.3, "b": 562.1, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 101, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 347.4, "r_y0": 562.1, "r_x1": 350.3, "r_y1": 562.1, "r_x2": 350.3, "r_y2": 557.1, "r_x3": 347.4, "r_y3": 557.1, "coord_origin": "TOPLEFT" }, "text": "L", "orig": "L", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 82, "label": "text", "bbox": { "l": 331.1, "t": 564.3, "r": 333.7, "b": 568.6, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 102, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 331.1, "r_y0": 568.6, "r_x1": 333.7, "r_y1": 568.6, "r_x2": 333.7, "r_y2": 564.3, "r_x3": 331.1, "r_y3": 564.3, "coord_origin": "TOPLEFT" }, "text": "3", "orig": "3", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 83, "label": "text", "bbox": { "l": 340.8, "t": 554.6, "r": 343.3, "b": 558.9, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 103, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 340.8, "r_y0": 558.9, "r_x1": 343.3, "r_y1": 558.9, "r_x2": 343.3, "r_y2": 554.6, "r_x3": 340.8, "r_y3": 554.6, "coord_origin": "TOPLEFT" }, "text": "2", "orig": "2", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 84, "label": "text", "bbox": { "l": 331.0, "t": 554.8, "r": 333.5, "b": 559.1, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 104, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 331.0, "r_y0": 559.1, "r_x1": 333.5, "r_y1": 559.1, "r_x2": 333.5, "r_y2": 554.8, "r_x3": 331.0, "r_y3": 554.8, "coord_origin": "TOPLEFT" }, "text": "1", "orig": "1", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] } ] }, "text": "", "annotations": [], "provenance": null, "predicted_class": null, "confidence": null }, { "label": "text", "id": 4, "page_no": 7, "cluster": { "id": 4, "label": "text", "bbox": { "l": 134.8, "t": 620.2, "r": 480.6, "b": 664.9, "coord_origin": "TOPLEFT" }, "confidence": 0.95, "cells": [ { "index": 105, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 149.7, "r_y0": 629.0, "r_x1": 480.6, "r_y1": 629.0, "r_x2": 480.6, "r_y2": 620.2, "r_x3": 149.7, "r_y3": 620.2, "coord_origin": "TOPLEFT" }, "text": "We rely on standard metrics such as Tree Edit Distance score (TEDs) for", "orig": "We rely on standard metrics such as Tree Edit Distance score (TEDs) for", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 106, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 134.8, "r_y0": 640.9, "r_x1": 480.6, "r_y1": 640.9, "r_x2": 480.6, "r_y2": 632.1, "r_x3": 134.8, "r_y3": 632.1, "coord_origin": "TOPLEFT" }, "text": "table structure prediction, and Mean Average Precision (mAP) with 0.75 Inter-", "orig": "table structure prediction, and Mean Average Precision (mAP) with 0.75 Inter-", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 107, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 134.8, "r_y0": 652.9, "r_x1": 480.6, "r_y1": 652.9, "r_x2": 480.6, "r_y2": 644.1, "r_x3": 134.8, "r_y3": 644.1, "coord_origin": "TOPLEFT" }, "text": "section Over Union (IOU) threshold for the bounding-box predictions of table", "orig": "section Over Union (IOU) threshold for the bounding-box predictions of table", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 108, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 134.8, "r_y0": 664.9, "r_x1": 480.6, "r_y1": 664.9, "r_x2": 480.6, "r_y2": 656.1, "r_x3": 134.8, "r_y3": 656.1, "coord_origin": "TOPLEFT" }, "text": "cells. The predicted OTSL structures were converted back to HTML format in", "orig": "cells. The predicted OTSL structures were converted back to HTML format in", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, "text": "We rely on standard metrics such as Tree Edit Distance score (TEDs) for table structure prediction, and Mean Average Precision (mAP) with 0.75 Intersection Over Union (IOU) threshold for the bounding-box predictions of table cells. The predicted OTSL structures were converted back to HTML format in" } ], "body": [ { "label": "text", "id": 5, "page_no": 7, "cluster": { "id": 5, "label": "text", "bbox": { "l": 134.8, "t": 118.9, "r": 480.6, "b": 139.7, "coord_origin": "TOPLEFT" }, "confidence": 0.95, "cells": [ { "index": 3, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 134.8, "r_y0": 127.7, "r_x1": 480.6, "r_y1": 127.7, "r_x2": 480.6, "r_y2": 118.9, "r_x3": 134.8, "r_y3": 118.9, "coord_origin": "TOPLEFT" }, "text": "reduces significantly the column drift seen in the HTML based models (see Fig-", "orig": "reduces significantly the column drift seen in the HTML based models (see Fig-", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 4, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 134.8, "r_y0": 139.7, "r_x1": 163.6, "r_y1": 139.7, "r_x2": 163.6, "r_y2": 130.9, "r_x3": 134.8, "r_y3": 130.9, "coord_origin": "TOPLEFT" }, "text": "ure 5).", "orig": "ure 5).", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, "text": "reduces significantly the column drift seen in the HTML based models (see Figure 5)." }, { "label": "section_header", "id": 2, "page_no": 7, "cluster": { "id": 2, "label": "section_header", "bbox": { "l": 134.8, "t": 161.6, "r": 319.3, "b": 170.4, "coord_origin": "TOPLEFT" }, "confidence": 0.95, "cells": [ { "index": 5, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 134.8, "r_y0": 170.4, "r_x1": 149.4, "r_y1": 170.4, "r_x2": 149.4, "r_y2": 161.6, "r_x3": 134.8, "r_y3": 161.6, "coord_origin": "TOPLEFT" }, "text": "4.3", "orig": "4.3", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 6, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 160.9, "r_y0": 170.4, "r_x1": 319.3, "r_y1": 170.4, "r_x2": 319.3, "r_y2": 161.6, "r_x3": 160.9, "r_y3": 161.6, "coord_origin": "TOPLEFT" }, "text": "Error-detection and -mitigation", "orig": "Error-detection and -mitigation", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, "text": "4.3 Error-detection and -mitigation" }, { "label": "text", "id": 0, "page_no": 7, "cluster": { "id": 0, "label": "text", "bbox": { "l": 134.8, "t": 182.3, "r": 480.6, "b": 298.7, "coord_origin": "TOPLEFT" }, "confidence": 0.99, "cells": [ { "index": 7, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 134.8, "r_y0": 191.1, "r_x1": 480.6, "r_y1": 191.1, "r_x2": 480.6, "r_y2": 182.3, "r_x3": 134.8, "r_y3": 182.3, "coord_origin": "TOPLEFT" }, "text": "The design of OTSL allows to validate a table structure easily on an unfinished", "orig": "The design of OTSL allows to validate a table structure easily on an unfinished", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 8, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 134.8, "r_y0": 203.0, "r_x1": 480.6, "r_y1": 203.0, "r_x2": 480.6, "r_y2": 194.2, "r_x3": 134.8, "r_y3": 194.2, "coord_origin": "TOPLEFT" }, "text": "sequence. The detection of an invalid sequence token is a clear indication of a", "orig": "sequence. The detection of an invalid sequence token is a clear indication of a", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 9, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 134.8, "r_y0": 215.0, "r_x1": 480.6, "r_y1": 215.0, "r_x2": 480.6, "r_y2": 206.2, "r_x3": 134.8, "r_y3": 206.2, "coord_origin": "TOPLEFT" }, "text": "prediction mistake, however a valid sequence by itself does not guarantee pre-", "orig": "prediction mistake, however a valid sequence by itself does not guarantee pre-", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 10, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 134.8, "r_y0": 226.9, "r_x1": 480.6, "r_y1": 226.9, "r_x2": 480.6, "r_y2": 218.1, "r_x3": 134.8, "r_y3": 218.1, "coord_origin": "TOPLEFT" }, "text": "diction correctness. Different heuristics can be used to correct token errors in", "orig": "diction correctness. Different heuristics can be used to correct token errors in", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 11, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 134.8, "r_y0": 238.9, "r_x1": 480.6, "r_y1": 238.9, "r_x2": 480.6, "r_y2": 230.1, "r_x3": 134.8, "r_y3": 230.1, "coord_origin": "TOPLEFT" }, "text": "an invalid sequence and thus increase the chances for accurate predictions. Such", "orig": "an invalid sequence and thus increase the chances for accurate predictions. Such", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 12, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 134.8, "r_y0": 250.9, "r_x1": 480.6, "r_y1": 250.9, "r_x2": 480.6, "r_y2": 242.1, "r_x3": 134.8, "r_y3": 242.1, "coord_origin": "TOPLEFT" }, "text": "heuristics can be applied either after the prediction of each token, or at the end", "orig": "heuristics can be applied either after the prediction of each token, or at the end", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 13, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 134.8, "r_y0": 262.8, "r_x1": 480.6, "r_y1": 262.8, "r_x2": 480.6, "r_y2": 254.0, "r_x3": 134.8, "r_y3": 254.0, "coord_origin": "TOPLEFT" }, "text": "on the entire predicted sequence. For example a simple heuristic which can cor-", "orig": "on the entire predicted sequence. For example a simple heuristic which can cor-", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 14, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 134.8, "r_y0": 274.8, "r_x1": 480.6, "r_y1": 274.8, "r_x2": 480.6, "r_y2": 266.0, "r_x3": 134.8, "r_y3": 266.0, "coord_origin": "TOPLEFT" }, "text": "rect the predicted OTSL sequence on-the-fly is to verify if the token with the", "orig": "rect the predicted OTSL sequence on-the-fly is to verify if the token with the", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 15, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 134.8, "r_y0": 286.7, "r_x1": 480.6, "r_y1": 286.7, "r_x2": 480.6, "r_y2": 277.9, "r_x3": 134.8, "r_y3": 277.9, "coord_origin": "TOPLEFT" }, "text": "highest prediction confidence invalidates the predicted sequence, and replace it", "orig": "highest prediction confidence invalidates the predicted sequence, and replace it", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 16, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 134.8, "r_y0": 298.7, "r_x1": 469.4, "r_y1": 298.7, "r_x2": 469.4, "r_y2": 289.9, "r_x3": 134.8, "r_y3": 289.9, "coord_origin": "TOPLEFT" }, "text": "by the token with the next highest confidence until OTSL rules are satisfied.", "orig": "by the token with the next highest confidence until OTSL rules are satisfied.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, "text": "The design of OTSL allows to validate a table structure easily on an unfinished sequence. The detection of an invalid sequence token is a clear indication of a prediction mistake, however a valid sequence by itself does not guarantee prediction correctness. Different heuristics can be used to correct token errors in an invalid sequence and thus increase the chances for accurate predictions. Such heuristics can be applied either after the prediction of each token, or at the end on the entire predicted sequence. For example a simple heuristic which can correct the predicted OTSL sequence on-the-fly is to verify if the token with the highest prediction confidence invalidates the predicted sequence, and replace it by the token with the next highest confidence until OTSL rules are satisfied." }, { "label": "section_header", "id": 3, "page_no": 7, "cluster": { "id": 3, "label": "section_header", "bbox": { "l": 134.8, "t": 321.2, "r": 229.0, "b": 331.7, "coord_origin": "TOPLEFT" }, "confidence": 0.95, "cells": [ { "index": 17, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 134.8, "r_y0": 331.7, "r_x1": 141.5, "r_y1": 331.7, "r_x2": 141.5, "r_y2": 321.2, "r_x3": 134.8, "r_y3": 321.2, "coord_origin": "TOPLEFT" }, "text": "5", "orig": "5", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 18, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 154.9, "r_y0": 331.7, "r_x1": 229.0, "r_y1": 331.7, "r_x2": 229.0, "r_y2": 321.2, "r_x3": 154.9, "r_y3": 321.2, "coord_origin": "TOPLEFT" }, "text": "Experiments", "orig": "Experiments", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, "text": "5 Experiments" }, { "label": "text", "id": 1, "page_no": 7, "cluster": { "id": 1, "label": "text", "bbox": { "l": 134.8, "t": 347.2, "r": 480.6, "b": 451.7, "coord_origin": "TOPLEFT" }, "confidence": 0.99, "cells": [ { "index": 19, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 134.8, "r_y0": 356.0, "r_x1": 480.6, "r_y1": 356.0, "r_x2": 480.6, "r_y2": 347.2, "r_x3": 134.8, "r_y3": 347.2, "coord_origin": "TOPLEFT" }, "text": "To evaluate the impact of OTSL on prediction accuracy and inference times, we", "orig": "To evaluate the impact of OTSL on prediction accuracy and inference times, we", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 20, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 134.8, "r_y0": 368.0, "r_x1": 480.6, "r_y1": 368.0, "r_x2": 480.6, "r_y2": 359.2, "r_x3": 134.8, "r_y3": 359.2, "coord_origin": "TOPLEFT" }, "text": "conducted a series of experiments based on the TableFormer model (Figure 4)", "orig": "conducted a series of experiments based on the TableFormer model (Figure 4)", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 21, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 134.8, "r_y0": 380.0, "r_x1": 480.6, "r_y1": 380.0, "r_x2": 480.6, "r_y2": 371.2, "r_x3": 134.8, "r_y3": 371.2, "coord_origin": "TOPLEFT" }, "text": "with two objectives: Firstly we evaluate the prediction quality and performance", "orig": "with two objectives: Firstly we evaluate the prediction quality and performance", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 22, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 134.8, "r_y0": 391.9, "r_x1": 480.6, "r_y1": 391.9, "r_x2": 480.6, "r_y2": 383.1, "r_x3": 134.8, "r_y3": 383.1, "coord_origin": "TOPLEFT" }, "text": "of OTSL vs. HTML after performing Hyper Parameter Optimization (HPO) on", "orig": "of OTSL vs. HTML after performing Hyper Parameter Optimization (HPO) on", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 23, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 134.8, "r_y0": 403.9, "r_x1": 148.6, "r_y1": 403.9, "r_x2": 148.6, "r_y2": 395.1, "r_x3": 134.8, "r_y3": 395.1, "coord_origin": "TOPLEFT" }, "text": "the", "orig": "the", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 24, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 151.6, "r_y0": 403.9, "r_x1": 191.8, "r_y1": 403.9, "r_x2": 191.8, "r_y2": 395.1, "r_x3": 151.6, "r_y3": 395.1, "coord_origin": "TOPLEFT" }, "text": "canonical", "orig": "canonical", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 25, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 195.9, "r_y0": 403.9, "r_x1": 480.6, "r_y1": 403.9, "r_x2": 480.6, "r_y2": 395.1, "r_x3": 195.9, "r_y3": 395.1, "coord_origin": "TOPLEFT" }, "text": "PubTabNet data set. Secondly we pick the best hyper-parameters", "orig": "PubTabNet data set. Secondly we pick the best hyper-parameters", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 26, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 134.8, "r_y0": 415.8, "r_x1": 480.6, "r_y1": 415.8, "r_x2": 480.6, "r_y2": 407.0, "r_x3": 134.8, "r_y3": 407.0, "coord_origin": "TOPLEFT" }, "text": "found in the first step and evaluate how OTSL impacts the performance of", "orig": "found in the first step and evaluate how OTSL impacts the performance of", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 27, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 134.8, "r_y0": 427.8, "r_x1": 480.6, "r_y1": 427.8, "r_x2": 480.6, "r_y2": 419.0, "r_x3": 134.8, "r_y3": 419.0, "coord_origin": "TOPLEFT" }, "text": "TableFormer after training on other publicly available data sets (FinTabNet,", "orig": "TableFormer after training on other publicly available data sets (FinTabNet,", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 28, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 134.8, "r_y0": 439.7, "r_x1": 480.6, "r_y1": 439.7, "r_x2": 480.6, "r_y2": 430.9, "r_x3": 134.8, "r_y3": 430.9, "coord_origin": "TOPLEFT" }, "text": "PubTables-1M [14]). The ground truth (GT) from all data sets has been con-", "orig": "PubTables-1M [14]). The ground truth (GT) from all data sets has been con-", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 29, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 134.8, "r_y0": 451.7, "r_x1": 479.3, "r_y1": 451.7, "r_x2": 479.3, "r_y2": 442.9, "r_x3": 134.8, "r_y3": 442.9, "coord_origin": "TOPLEFT" }, "text": "verted into OTSL format for this purpose, and will be made publicly available.", "orig": "verted into OTSL format for this purpose, and will be made publicly available.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, "text": "To evaluate the impact of OTSL on prediction accuracy and inference times, we conducted a series of experiments based on the TableFormer model (Figure 4) with two objectives: Firstly we evaluate the prediction quality and performance of OTSL vs. HTML after performing Hyper Parameter Optimization (HPO) on the canonical PubTabNet data set. Secondly we pick the best hyper-parameters found in the first step and evaluate how OTSL impacts the performance of TableFormer after training on other publicly available data sets (FinTabNet, PubTables-1M [14]). The ground truth (GT) from all data sets has been converted into OTSL format for this purpose, and will be made publicly available." }, { "label": "caption", "id": 7, "page_no": 7, "cluster": { "id": 7, "label": "caption", "bbox": { "l": 134.8, "t": 484.6, "r": 480.6, "b": 503.7, "coord_origin": "TOPLEFT" }, "confidence": 0.93, "cells": [ { "index": 30, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 134.8, "r_y0": 492.6, "r_x1": 162.6, "r_y1": 492.6, "r_x2": 162.6, "r_y2": 484.6, "r_x3": 134.8, "r_y3": 484.6, "coord_origin": "TOPLEFT" }, "text": "Fig. 4.", "orig": "Fig. 4.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 31, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 165.2, "r_y0": 492.8, "r_x1": 480.6, "r_y1": 492.8, "r_x2": 480.6, "r_y2": 484.7, "r_x3": 165.2, "r_y3": 484.7, "coord_origin": "TOPLEFT" }, "text": "Architecture sketch of the TableFormer model, which is a representative for the", "orig": "Architecture sketch of the TableFormer model, which is a representative for the", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 32, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 134.8, "r_y0": 503.7, "r_x1": 206.7, "r_y1": 503.7, "r_x2": 206.7, "r_y2": 495.7, "r_x3": 134.8, "r_y3": 495.7, "coord_origin": "TOPLEFT" }, "text": "Im2Seq approach.", "orig": "Im2Seq approach.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, "text": "Fig. 4. Architecture sketch of the TableFormer model, which is a representative for the Im2Seq approach." }, { "label": "picture", "id": 6, "page_no": 7, "cluster": { "id": 6, "label": "picture", "bbox": { "l": 140.7, "t": 508.1, "r": 472.7, "b": 593.7, "coord_origin": "TOPLEFT" }, "confidence": 0.93, "cells": [ { "index": 33, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 147.3, "r_y0": 543.1, "r_x1": 149.7, "r_y1": 543.1, "r_x2": 149.7, "r_y2": 540.7, "r_x3": 147.3, "r_y3": 540.7, "coord_origin": "TOPLEFT" }, "text": "1.", "orig": "1.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 34, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 150.9, "r_y0": 543.1, "r_x1": 155.7, "r_y1": 543.1, "r_x2": 155.7, "r_y2": 540.7, "r_x3": 150.9, "r_y3": 540.7, "coord_origin": "TOPLEFT" }, "text": "Item", "orig": "Item", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 35, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 162.8, "r_y0": 537.8, "r_x1": 172.3, "r_y1": 537.8, "r_x2": 172.3, "r_y2": 535.4, "r_x3": 162.8, "r_y3": 535.4, "coord_origin": "TOPLEFT" }, "text": "Amount", "orig": "Amount", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 36, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 147.6, "r_y0": 537.7, "r_x1": 155.9, "r_y1": 537.7, "r_x2": 155.9, "r_y2": 535.4, "r_x3": 147.6, "r_y3": 535.4, "coord_origin": "TOPLEFT" }, "text": "Names", "orig": "Names", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 37, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 158.5, "r_y0": 543.1, "r_x1": 164.1, "r_y1": 543.1, "r_x2": 164.1, "r_y2": 540.7, "r_x3": 158.5, "r_y3": 540.7, "coord_origin": "TOPLEFT" }, "text": "1000", "orig": "1000", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 38, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 158.5, "r_y0": 547.0, "r_x1": 162.7, "r_y1": 547.0, "r_x2": 162.7, "r_y2": 544.7, "r_x3": 158.5, "r_y3": 544.7, "coord_origin": "TOPLEFT" }, "text": "500", "orig": "500", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 39, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 158.5, "r_y0": 551.3, "r_x1": 164.1, "r_y1": 551.3, "r_x2": 164.1, "r_y2": 548.9, "r_x3": 158.5, "r_y3": 548.9, "coord_origin": "TOPLEFT" }, "text": "3500", "orig": "3500", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 40, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 158.5, "r_y0": 555.5, "r_x1": 162.7, "r_y1": 555.5, "r_x2": 162.7, "r_y2": 553.2, "r_x3": 158.5, "r_y3": 553.2, "coord_origin": "TOPLEFT" }, "text": "150", "orig": "150", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 41, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 168.8, "r_y0": 543.1, "r_x1": 172.9, "r_y1": 543.1, "r_x2": 172.9, "r_y2": 540.7, "r_x3": 168.8, "r_y3": 540.7, "coord_origin": "TOPLEFT" }, "text": "unit", "orig": "unit", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 42, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 168.8, "r_y0": 547.0, "r_x1": 172.9, "r_y1": 547.0, "r_x2": 172.9, "r_y2": 544.7, "r_x3": 168.8, "r_y3": 544.7, "coord_origin": "TOPLEFT" }, "text": "unit", "orig": "unit", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 43, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 168.8, "r_y0": 551.3, "r_x1": 172.9, "r_y1": 551.3, "r_x2": 172.9, "r_y2": 548.9, "r_x3": 168.8, "r_y3": 548.9, "coord_origin": "TOPLEFT" }, "text": "unit", "orig": "unit", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 44, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 168.8, "r_y0": 555.5, "r_x1": 172.9, "r_y1": 555.5, "r_x2": 172.9, "r_y2": 553.2, "r_x3": 168.8, "r_y3": 553.2, "coord_origin": "TOPLEFT" }, "text": "unit", "orig": "unit", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 45, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 147.3, "r_y0": 547.0, "r_x1": 149.7, "r_y1": 547.0, "r_x2": 149.7, "r_y2": 544.7, "r_x3": 147.3, "r_y3": 544.7, "coord_origin": "TOPLEFT" }, "text": "2.", "orig": "2.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 46, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 150.9, "r_y0": 547.0, "r_x1": 155.7, "r_y1": 547.0, "r_x2": 155.7, "r_y2": 544.7, "r_x3": 150.9, "r_y3": 544.7, "coord_origin": "TOPLEFT" }, "text": "Item", "orig": "Item", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 47, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 147.3, "r_y0": 551.3, "r_x1": 149.7, "r_y1": 551.3, "r_x2": 149.7, "r_y2": 548.9, "r_x3": 147.3, "r_y3": 548.9, "coord_origin": "TOPLEFT" }, "text": "3.", "orig": "3.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 48, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 150.9, "r_y0": 551.3, "r_x1": 155.7, "r_y1": 551.3, "r_x2": 155.7, "r_y2": 548.9, "r_x3": 150.9, "r_y3": 548.9, "coord_origin": "TOPLEFT" }, "text": "Item", "orig": "Item", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 49, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 147.3, "r_y0": 555.5, "r_x1": 149.7, "r_y1": 555.5, "r_x2": 149.7, "r_y2": 553.2, "r_x3": 147.3, "r_y3": 553.2, "coord_origin": "TOPLEFT" }, "text": "4.", "orig": "4.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 50, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 150.9, "r_y0": 555.5, "r_x1": 155.7, "r_y1": 555.5, "r_x2": 155.7, "r_y2": 553.2, "r_x3": 150.9, "r_y3": 553.2, "coord_origin": "TOPLEFT" }, "text": "Item", "orig": "Item", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 51, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 152.1, "r_y0": 521.3, "r_x1": 171.2, "r_y1": 521.3, "r_x2": 171.2, "r_y2": 517.0, "r_x3": 152.1, "r_y3": 517.0, "coord_origin": "TOPLEFT" }, "text": "Extracted", "orig": "Extracted", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 52, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 148.1, "r_y0": 526.6, "r_x1": 175.2, "r_y1": 526.6, "r_x2": 175.2, "r_y2": 522.3, "r_x3": 148.1, "r_y3": 522.3, "coord_origin": "TOPLEFT" }, "text": "Table Images", "orig": "Table Images", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 53, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 193.5, "r_y0": 528.8, "r_x1": 220.3, "r_y1": 528.8, "r_x2": 220.3, "r_y2": 524.5, "r_x3": 193.5, "r_y3": 524.5, "coord_origin": "TOPLEFT" }, "text": "Standardized", "orig": "Standardized", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 54, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 199.5, "r_y0": 534.1, "r_x1": 214.4, "r_y1": 534.1, "r_x2": 214.4, "r_y2": 529.8, "r_x3": 199.5, "r_y3": 529.8, "coord_origin": "TOPLEFT" }, "text": "Images", "orig": "Images", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 55, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 273.6, "r_y0": 514.2, "r_x1": 284.5, "r_y1": 514.2, "r_x2": 284.5, "r_y2": 509.9, "r_x3": 273.6, "r_y3": 509.9, "coord_origin": "TOPLEFT" }, "text": "BBox", "orig": "BBox", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 56, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 270.5, "r_y0": 518.0, "r_x1": 287.6, "r_y1": 518.0, "r_x2": 287.6, "r_y2": 513.7, "r_x3": 270.5, "r_y3": 513.7, "coord_origin": "TOPLEFT" }, "text": "Decoder", "orig": "Decoder", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 57, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 332.5, "r_y0": 512.4, "r_x1": 348.1, "r_y1": 512.4, "r_x2": 348.1, "r_y2": 508.1, "r_x3": 332.5, "r_y3": 508.1, "coord_origin": "TOPLEFT" }, "text": "BBoxes", "orig": "BBoxes", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 58, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 376.7, "r_y0": 525.4, "r_x1": 407.3, "r_y1": 525.4, "r_x2": 407.3, "r_y2": 521.1, "r_x3": 376.7, "r_y3": 521.1, "coord_origin": "TOPLEFT" }, "text": "BBoxes can be", "orig": "BBoxes can be", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 59, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 373.9, "r_y0": 529.9, "r_x1": 410.0, "r_y1": 529.9, "r_x2": 410.0, "r_y2": 525.7, "r_x3": 373.9, "r_y3": 525.7, "coord_origin": "TOPLEFT" }, "text": "traced back to the", "orig": "traced back to the", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 60, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 375.3, "r_y0": 534.5, "r_x1": 408.6, "r_y1": 534.5, "r_x2": 408.6, "r_y2": 530.2, "r_x3": 375.3, "r_y3": 530.2, "coord_origin": "TOPLEFT" }, "text": "original image to", "orig": "original image to", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 61, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 377.1, "r_y0": 539.0, "r_x1": 406.9, "r_y1": 539.0, "r_x2": 406.9, "r_y2": 534.8, "r_x3": 377.1, "r_y3": 534.8, "coord_origin": "TOPLEFT" }, "text": "extract content", "orig": "extract content", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 62, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 383.6, "r_y0": 567.5, "r_x1": 433.8, "r_y1": 567.5, "r_x2": 433.8, "r_y2": 563.2, "r_x3": 383.6, "r_y3": 563.2, "coord_origin": "TOPLEFT" }, "text": "Structure Tags sequence", "orig": "Structure Tags sequence", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 63, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 383.5, "r_y0": 572.0, "r_x1": 433.8, "r_y1": 572.0, "r_x2": 433.8, "r_y2": 567.8, "r_x3": 383.5, "r_y3": 567.8, "coord_origin": "TOPLEFT" }, "text": "provide full description of", "orig": "provide full description of", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 64, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 390.5, "r_y0": 576.6, "r_x1": 426.9, "r_y1": 576.6, "r_x2": 426.9, "r_y2": 572.3, "r_x3": 390.5, "r_y3": 572.3, "coord_origin": "TOPLEFT" }, "text": "the table structure", "orig": "the table structure", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 65, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 293.9, "r_y0": 582.2, "r_x1": 323.2, "r_y1": 582.2, "r_x2": 323.2, "r_y2": 577.9, "r_x3": 293.9, "r_y3": 577.9, "coord_origin": "TOPLEFT" }, "text": "Structure Tags", "orig": "Structure Tags", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 66, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 293.9, "r_y0": 586.7, "r_x1": 324.6, "r_y1": 586.7, "r_x2": 324.6, "r_y2": 582.4, "r_x3": 293.9, "r_y3": 582.4, "coord_origin": "TOPLEFT" }, "text": "in OTSL format", "orig": "in OTSL format", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 67, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 333.1, "r_y0": 546.1, "r_x1": 364.1, "r_y1": 546.1, "r_x2": 364.1, "r_y2": 541.8, "r_x3": 333.1, "r_y3": 541.8, "coord_origin": "TOPLEFT" }, "text": "BBoxes in sync", "orig": "BBoxes in sync", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 68, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 333.1, "r_y0": 549.9, "r_x1": 369.7, "r_y1": 549.9, "r_x2": 369.7, "r_y2": 545.6, "r_x3": 333.1, "r_y3": 545.6, "coord_origin": "TOPLEFT" }, "text": "with tag sequence", "orig": "with tag sequence", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 69, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 232.7, "r_y0": 519.5, "r_x1": 249.6, "r_y1": 519.5, "r_x2": 249.6, "r_y2": 515.2, "r_x3": 232.7, "r_y3": 515.2, "coord_origin": "TOPLEFT" }, "text": "Encoder", "orig": "Encoder", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 70, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 269.8, "r_y0": 550.2, "r_x1": 288.3, "r_y1": 550.2, "r_x2": 288.3, "r_y2": 546.0, "r_x3": 269.8, "r_y3": 546.0, "coord_origin": "TOPLEFT" }, "text": "Structure", "orig": "Structure", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 71, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 270.5, "r_y0": 554.0, "r_x1": 287.6, "r_y1": 554.0, "r_x2": 287.6, "r_y2": 549.8, "r_x3": 270.5, "r_y3": 549.8, "coord_origin": "TOPLEFT" }, "text": "Decoder", "orig": "Decoder", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 72, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 332.2, "r_y0": 520.2, "r_x1": 358.1, "r_y1": 520.2, "r_x2": 358.1, "r_y2": 515.9, "r_x3": 332.2, "r_y3": 515.9, "coord_origin": "TOPLEFT" }, "text": "[x1, y2, x2, y2]", "orig": "[x1, y2, x2, y2]", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 73, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 332.2, "r_y0": 526.2, "r_x1": 361.6, "r_y1": 526.2, "r_x2": 361.6, "r_y2": 522.0, "r_x3": 332.2, "r_y3": 522.0, "coord_origin": "TOPLEFT" }, "text": "[x1', y2', x2', y2']", "orig": "[x1', y2', x2', y2']", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 74, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 332.2, "r_y0": 532.3, "r_x1": 364.8, "r_y1": 532.3, "r_x2": 364.8, "r_y2": 528.0, "r_x3": 332.2, "r_y3": 528.0, "coord_origin": "TOPLEFT" }, "text": "[x1'', y2'', x2'', y2'']", "orig": "[x1'', y2'', x2'', y2'']", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 75, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 332.2, "r_y0": 538.4, "r_x1": 336.0, "r_y1": 538.4, "r_x2": 336.0, "r_y2": 534.1, "r_x3": 332.2, "r_y3": 534.1, "coord_origin": "TOPLEFT" }, "text": "...", "orig": "...", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 76, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 326.9, "r_y0": 520.7, "r_x1": 329.4, "r_y1": 520.7, "r_x2": 329.4, "r_y2": 516.4, "r_x3": 326.9, "r_y3": 516.4, "coord_origin": "TOPLEFT" }, "text": "1", "orig": "1", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 77, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 327.0, "r_y0": 526.7, "r_x1": 329.6, "r_y1": 526.7, "r_x2": 329.6, "r_y2": 522.4, "r_x3": 327.0, "r_y3": 522.4, "coord_origin": "TOPLEFT" }, "text": "2", "orig": "2", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 78, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 327.0, "r_y0": 532.8, "r_x1": 329.6, "r_y1": 532.8, "r_x2": 329.6, "r_y2": 528.5, "r_x3": 327.0, "r_y3": 528.5, "coord_origin": "TOPLEFT" }, "text": "3", "orig": "3", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 79, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 424.1, "r_y0": 531.7, "r_x1": 426.7, "r_y1": 531.7, "r_x2": 426.7, "r_y2": 527.4, "r_x3": 424.1, "r_y3": 527.4, "coord_origin": "TOPLEFT" }, "text": "3", "orig": "3", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 80, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 453.0, "r_y0": 521.7, "r_x1": 455.5, "r_y1": 521.7, "r_x2": 455.5, "r_y2": 517.5, "r_x3": 453.0, "r_y3": 517.5, "coord_origin": "TOPLEFT" }, "text": "2", "orig": "2", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 81, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 423.9, "r_y0": 521.3, "r_x1": 426.4, "r_y1": 521.3, "r_x2": 426.4, "r_y2": 517.1, "r_x3": 423.9, "r_y3": 517.1, "coord_origin": "TOPLEFT" }, "text": "1", "orig": "1", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 82, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 333.4, "r_y0": 562.4, "r_x1": 337.3, "r_y1": 562.4, "r_x2": 337.3, "r_y2": 557.4, "r_x3": 333.4, "r_y3": 557.4, "coord_origin": "TOPLEFT" }, "text": "C", "orig": "C", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 83, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 340.4, "r_y0": 562.3, "r_x1": 344.2, "r_y1": 562.3, "r_x2": 344.2, "r_y2": 557.3, "r_x3": 340.4, "r_y3": 557.3, "coord_origin": "TOPLEFT" }, "text": "C", "orig": "C", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 84, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 340.3, "r_y0": 568.9, "r_x1": 344.2, "r_y1": 568.9, "r_x2": 344.2, "r_y2": 563.9, "r_x3": 340.3, "r_y3": 563.9, "coord_origin": "TOPLEFT" }, "text": "C", "orig": "C", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 85, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 346.8, "r_y0": 568.9, "r_x1": 350.6, "r_y1": 568.9, "r_x2": 350.6, "r_y2": 563.9, "r_x3": 346.8, "r_y3": 563.9, "coord_origin": "TOPLEFT" }, "text": "C", "orig": "C", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 86, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 333.6, "r_y0": 568.8, "r_x1": 337.4, "r_y1": 568.8, "r_x2": 337.4, "r_y2": 563.8, "r_x3": 333.6, "r_y3": 563.8, "coord_origin": "TOPLEFT" }, "text": "C", "orig": "C", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 87, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 340.4, "r_y0": 575.4, "r_x1": 344.2, "r_y1": 575.4, "r_x2": 344.2, "r_y2": 570.4, "r_x3": 340.4, "r_y3": 570.4, "coord_origin": "TOPLEFT" }, "text": "C", "orig": "C", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 88, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 346.9, "r_y0": 575.4, "r_x1": 350.7, "r_y1": 575.4, "r_x2": 350.7, "r_y2": 570.4, "r_x3": 346.9, "r_y3": 570.4, "coord_origin": "TOPLEFT" }, "text": "C", "orig": "C", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 89, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 333.7, "r_y0": 575.4, "r_x1": 337.5, "r_y1": 575.4, "r_x2": 337.5, "r_y2": 570.4, "r_x3": 333.7, "r_y3": 570.4, "coord_origin": "TOPLEFT" }, "text": "C", "orig": "C", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 90, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 340.4, "r_y0": 582.0, "r_x1": 344.2, "r_y1": 582.0, "r_x2": 344.2, "r_y2": 577.0, "r_x3": 340.4, "r_y3": 577.0, "coord_origin": "TOPLEFT" }, "text": "C", "orig": "C", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 91, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 346.9, "r_y0": 582.0, "r_x1": 350.7, "r_y1": 582.0, "r_x2": 350.7, "r_y2": 577.0, "r_x3": 346.9, "r_y3": 577.0, "coord_origin": "TOPLEFT" }, "text": "C", "orig": "C", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 92, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 333.7, "r_y0": 582.0, "r_x1": 337.5, "r_y1": 582.0, "r_x2": 337.5, "r_y2": 577.0, "r_x3": 333.7, "r_y3": 577.0, "coord_origin": "TOPLEFT" }, "text": "C", "orig": "C", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 93, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 340.3, "r_y0": 588.4, "r_x1": 344.1, "r_y1": 588.4, "r_x2": 344.1, "r_y2": 583.4, "r_x3": 340.3, "r_y3": 583.4, "coord_origin": "TOPLEFT" }, "text": "C", "orig": "C", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 94, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 346.8, "r_y0": 588.4, "r_x1": 350.6, "r_y1": 588.4, "r_x2": 350.6, "r_y2": 583.4, "r_x3": 346.8, "r_y3": 583.4, "coord_origin": "TOPLEFT" }, "text": "C", "orig": "C", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 95, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 333.6, "r_y0": 588.3, "r_x1": 337.4, "r_y1": 588.3, "r_x2": 337.4, "r_y2": 583.4, "r_x3": 333.6, "r_y3": 583.4, "coord_origin": "TOPLEFT" }, "text": "C", "orig": "C", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 96, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 353.0, "r_y0": 561.9, "r_x1": 359.8, "r_y1": 561.9, "r_x2": 359.8, "r_y2": 556.9, "r_x3": 353.0, "r_y3": 556.9, "coord_origin": "TOPLEFT" }, "text": "NL", "orig": "NL", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 97, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 353.2, "r_y0": 568.6, "r_x1": 360.0, "r_y1": 568.6, "r_x2": 360.0, "r_y2": 563.6, "r_x3": 353.2, "r_y3": 563.6, "coord_origin": "TOPLEFT" }, "text": "NL", "orig": "NL", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 98, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 353.2, "r_y0": 575.2, "r_x1": 360.0, "r_y1": 575.2, "r_x2": 360.0, "r_y2": 570.2, "r_x3": 353.2, "r_y3": 570.2, "coord_origin": "TOPLEFT" }, "text": "NL", "orig": "NL", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 99, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 353.2, "r_y0": 581.8, "r_x1": 360.0, "r_y1": 581.8, "r_x2": 360.0, "r_y2": 576.8, "r_x3": 353.2, "r_y3": 576.8, "coord_origin": "TOPLEFT" }, "text": "NL", "orig": "NL", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 100, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 353.3, "r_y0": 588.4, "r_x1": 360.1, "r_y1": 588.4, "r_x2": 360.1, "r_y2": 583.4, "r_x3": 353.3, "r_y3": 583.4, "coord_origin": "TOPLEFT" }, "text": "NL", "orig": "NL", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 101, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 347.4, "r_y0": 562.1, "r_x1": 350.3, "r_y1": 562.1, "r_x2": 350.3, "r_y2": 557.1, "r_x3": 347.4, "r_y3": 557.1, "coord_origin": "TOPLEFT" }, "text": "L", "orig": "L", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 102, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 331.1, "r_y0": 568.6, "r_x1": 333.7, "r_y1": 568.6, "r_x2": 333.7, "r_y2": 564.3, "r_x3": 331.1, "r_y3": 564.3, "coord_origin": "TOPLEFT" }, "text": "3", "orig": "3", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 103, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 340.8, "r_y0": 558.9, "r_x1": 343.3, "r_y1": 558.9, "r_x2": 343.3, "r_y2": 554.6, "r_x3": 340.8, "r_y3": 554.6, "coord_origin": "TOPLEFT" }, "text": "2", "orig": "2", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 104, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 331.0, "r_y0": 559.1, "r_x1": 333.5, "r_y1": 559.1, "r_x2": 333.5, "r_y2": 554.8, "r_x3": 331.0, "r_y3": 554.8, "coord_origin": "TOPLEFT" }, "text": "1", "orig": "1", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [ { "id": 13, "label": "text", "bbox": { "l": 147.3, "t": 540.7, "r": 149.7, "b": 543.1, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 33, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 147.3, "r_y0": 543.1, "r_x1": 149.7, "r_y1": 543.1, "r_x2": 149.7, "r_y2": 540.7, "r_x3": 147.3, "r_y3": 540.7, "coord_origin": "TOPLEFT" }, "text": "1.", "orig": "1.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 14, "label": "text", "bbox": { "l": 150.9, "t": 540.7, "r": 155.7, "b": 543.1, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 34, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 150.9, "r_y0": 543.1, "r_x1": 155.7, "r_y1": 543.1, "r_x2": 155.7, "r_y2": 540.7, "r_x3": 150.9, "r_y3": 540.7, "coord_origin": "TOPLEFT" }, "text": "Item", "orig": "Item", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 15, "label": "text", "bbox": { "l": 162.8, "t": 535.4, "r": 172.3, "b": 537.8, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 35, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 162.8, "r_y0": 537.8, "r_x1": 172.3, "r_y1": 537.8, "r_x2": 172.3, "r_y2": 535.4, "r_x3": 162.8, "r_y3": 535.4, "coord_origin": "TOPLEFT" }, "text": "Amount", "orig": "Amount", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 16, "label": "text", "bbox": { "l": 147.6, "t": 535.4, "r": 155.9, "b": 537.7, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 36, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 147.6, "r_y0": 537.7, "r_x1": 155.9, "r_y1": 537.7, "r_x2": 155.9, "r_y2": 535.4, "r_x3": 147.6, "r_y3": 535.4, "coord_origin": "TOPLEFT" }, "text": "Names", "orig": "Names", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 17, "label": "text", "bbox": { "l": 158.5, "t": 540.7, "r": 164.1, "b": 543.1, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 37, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 158.5, "r_y0": 543.1, "r_x1": 164.1, "r_y1": 543.1, "r_x2": 164.1, "r_y2": 540.7, "r_x3": 158.5, "r_y3": 540.7, "coord_origin": "TOPLEFT" }, "text": "1000", "orig": "1000", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 18, "label": "text", "bbox": { "l": 158.5, "t": 544.7, "r": 162.7, "b": 547.0, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 38, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 158.5, "r_y0": 547.0, "r_x1": 162.7, "r_y1": 547.0, "r_x2": 162.7, "r_y2": 544.7, "r_x3": 158.5, "r_y3": 544.7, "coord_origin": "TOPLEFT" }, "text": "500", "orig": "500", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 19, "label": "text", "bbox": { "l": 158.5, "t": 548.9, "r": 164.1, "b": 551.3, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 39, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 158.5, "r_y0": 551.3, "r_x1": 164.1, "r_y1": 551.3, "r_x2": 164.1, "r_y2": 548.9, "r_x3": 158.5, "r_y3": 548.9, "coord_origin": "TOPLEFT" }, "text": "3500", "orig": "3500", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 20, "label": "text", "bbox": { "l": 158.5, "t": 553.2, "r": 162.7, "b": 555.5, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 40, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 158.5, "r_y0": 555.5, "r_x1": 162.7, "r_y1": 555.5, "r_x2": 162.7, "r_y2": 553.2, "r_x3": 158.5, "r_y3": 553.2, "coord_origin": "TOPLEFT" }, "text": "150", "orig": "150", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 21, "label": "text", "bbox": { "l": 168.8, "t": 540.7, "r": 172.9, "b": 543.1, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 41, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 168.8, "r_y0": 543.1, "r_x1": 172.9, "r_y1": 543.1, "r_x2": 172.9, "r_y2": 540.7, "r_x3": 168.8, "r_y3": 540.7, "coord_origin": "TOPLEFT" }, "text": "unit", "orig": "unit", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 22, "label": "text", "bbox": { "l": 168.8, "t": 544.7, "r": 172.9, "b": 547.0, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 42, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 168.8, "r_y0": 547.0, "r_x1": 172.9, "r_y1": 547.0, "r_x2": 172.9, "r_y2": 544.7, "r_x3": 168.8, "r_y3": 544.7, "coord_origin": "TOPLEFT" }, "text": "unit", "orig": "unit", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 23, "label": "text", "bbox": { "l": 168.8, "t": 548.9, "r": 172.9, "b": 551.3, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 43, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 168.8, "r_y0": 551.3, "r_x1": 172.9, "r_y1": 551.3, "r_x2": 172.9, "r_y2": 548.9, "r_x3": 168.8, "r_y3": 548.9, "coord_origin": "TOPLEFT" }, "text": "unit", "orig": "unit", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 24, "label": "text", "bbox": { "l": 168.8, "t": 553.2, "r": 172.9, "b": 555.5, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 44, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 168.8, "r_y0": 555.5, "r_x1": 172.9, "r_y1": 555.5, "r_x2": 172.9, "r_y2": 553.2, "r_x3": 168.8, "r_y3": 553.2, "coord_origin": "TOPLEFT" }, "text": "unit", "orig": "unit", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 25, "label": "text", "bbox": { "l": 147.3, "t": 544.7, "r": 149.7, "b": 547.0, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 45, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 147.3, "r_y0": 547.0, "r_x1": 149.7, "r_y1": 547.0, "r_x2": 149.7, "r_y2": 544.7, "r_x3": 147.3, "r_y3": 544.7, "coord_origin": "TOPLEFT" }, "text": "2.", "orig": "2.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 26, "label": "text", "bbox": { "l": 150.9, "t": 544.7, "r": 155.7, "b": 547.0, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 46, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 150.9, "r_y0": 547.0, "r_x1": 155.7, "r_y1": 547.0, "r_x2": 155.7, "r_y2": 544.7, "r_x3": 150.9, "r_y3": 544.7, "coord_origin": "TOPLEFT" }, "text": "Item", "orig": "Item", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 27, "label": "text", "bbox": { "l": 147.3, "t": 548.9, "r": 149.7, "b": 551.3, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 47, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 147.3, "r_y0": 551.3, "r_x1": 149.7, "r_y1": 551.3, "r_x2": 149.7, "r_y2": 548.9, "r_x3": 147.3, "r_y3": 548.9, "coord_origin": "TOPLEFT" }, "text": "3.", "orig": "3.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 28, "label": "text", "bbox": { "l": 150.9, "t": 548.9, "r": 155.7, "b": 551.3, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 48, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 150.9, "r_y0": 551.3, "r_x1": 155.7, "r_y1": 551.3, "r_x2": 155.7, "r_y2": 548.9, "r_x3": 150.9, "r_y3": 548.9, "coord_origin": "TOPLEFT" }, "text": "Item", "orig": "Item", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 29, "label": "text", "bbox": { "l": 147.3, "t": 553.2, "r": 149.7, "b": 555.5, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 49, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 147.3, "r_y0": 555.5, "r_x1": 149.7, "r_y1": 555.5, "r_x2": 149.7, "r_y2": 553.2, "r_x3": 147.3, "r_y3": 553.2, "coord_origin": "TOPLEFT" }, "text": "4.", "orig": "4.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 30, "label": "text", "bbox": { "l": 150.9, "t": 553.2, "r": 155.7, "b": 555.5, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 50, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 150.9, "r_y0": 555.5, "r_x1": 155.7, "r_y1": 555.5, "r_x2": 155.7, "r_y2": 553.2, "r_x3": 150.9, "r_y3": 553.2, "coord_origin": "TOPLEFT" }, "text": "Item", "orig": "Item", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 31, "label": "text", "bbox": { "l": 152.1, "t": 517.0, "r": 171.2, "b": 521.3, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 51, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 152.1, "r_y0": 521.3, "r_x1": 171.2, "r_y1": 521.3, "r_x2": 171.2, "r_y2": 517.0, "r_x3": 152.1, "r_y3": 517.0, "coord_origin": "TOPLEFT" }, "text": "Extracted", "orig": "Extracted", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 32, "label": "text", "bbox": { "l": 148.1, "t": 522.3, "r": 175.2, "b": 526.6, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 52, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 148.1, "r_y0": 526.6, "r_x1": 175.2, "r_y1": 526.6, "r_x2": 175.2, "r_y2": 522.3, "r_x3": 148.1, "r_y3": 522.3, "coord_origin": "TOPLEFT" }, "text": "Table Images", "orig": "Table Images", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 33, "label": "text", "bbox": { "l": 193.5, "t": 524.5, "r": 220.3, "b": 528.8, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 53, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 193.5, "r_y0": 528.8, "r_x1": 220.3, "r_y1": 528.8, "r_x2": 220.3, "r_y2": 524.5, "r_x3": 193.5, "r_y3": 524.5, "coord_origin": "TOPLEFT" }, "text": "Standardized", "orig": "Standardized", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 34, "label": "text", "bbox": { "l": 199.5, "t": 529.8, "r": 214.4, "b": 534.1, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 54, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 199.5, "r_y0": 534.1, "r_x1": 214.4, "r_y1": 534.1, "r_x2": 214.4, "r_y2": 529.8, "r_x3": 199.5, "r_y3": 529.8, "coord_origin": "TOPLEFT" }, "text": "Images", "orig": "Images", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 35, "label": "text", "bbox": { "l": 273.6, "t": 509.9, "r": 284.5, "b": 514.2, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 55, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 273.6, "r_y0": 514.2, "r_x1": 284.5, "r_y1": 514.2, "r_x2": 284.5, "r_y2": 509.9, "r_x3": 273.6, "r_y3": 509.9, "coord_origin": "TOPLEFT" }, "text": "BBox", "orig": "BBox", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 36, "label": "text", "bbox": { "l": 270.5, "t": 513.7, "r": 287.6, "b": 518.0, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 56, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 270.5, "r_y0": 518.0, "r_x1": 287.6, "r_y1": 518.0, "r_x2": 287.6, "r_y2": 513.7, "r_x3": 270.5, "r_y3": 513.7, "coord_origin": "TOPLEFT" }, "text": "Decoder", "orig": "Decoder", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 37, "label": "text", "bbox": { "l": 332.5, "t": 508.1, "r": 348.1, "b": 512.4, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 57, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 332.5, "r_y0": 512.4, "r_x1": 348.1, "r_y1": 512.4, "r_x2": 348.1, "r_y2": 508.1, "r_x3": 332.5, "r_y3": 508.1, "coord_origin": "TOPLEFT" }, "text": "BBoxes", "orig": "BBoxes", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 38, "label": "text", "bbox": { "l": 376.7, "t": 521.1, "r": 407.3, "b": 525.4, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 58, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 376.7, "r_y0": 525.4, "r_x1": 407.3, "r_y1": 525.4, "r_x2": 407.3, "r_y2": 521.1, "r_x3": 376.7, "r_y3": 521.1, "coord_origin": "TOPLEFT" }, "text": "BBoxes can be", "orig": "BBoxes can be", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 39, "label": "text", "bbox": { "l": 373.9, "t": 525.7, "r": 410.0, "b": 529.9, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 59, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 373.9, "r_y0": 529.9, "r_x1": 410.0, "r_y1": 529.9, "r_x2": 410.0, "r_y2": 525.7, "r_x3": 373.9, "r_y3": 525.7, "coord_origin": "TOPLEFT" }, "text": "traced back to the", "orig": "traced back to the", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 40, "label": "text", "bbox": { "l": 375.3, "t": 530.2, "r": 408.6, "b": 534.5, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 60, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 375.3, "r_y0": 534.5, "r_x1": 408.6, "r_y1": 534.5, "r_x2": 408.6, "r_y2": 530.2, "r_x3": 375.3, "r_y3": 530.2, "coord_origin": "TOPLEFT" }, "text": "original image to", "orig": "original image to", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 41, "label": "text", "bbox": { "l": 377.1, "t": 534.8, "r": 406.9, "b": 539.0, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 61, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 377.1, "r_y0": 539.0, "r_x1": 406.9, "r_y1": 539.0, "r_x2": 406.9, "r_y2": 534.8, "r_x3": 377.1, "r_y3": 534.8, "coord_origin": "TOPLEFT" }, "text": "extract content", "orig": "extract content", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 42, "label": "text", "bbox": { "l": 383.6, "t": 563.2, "r": 433.8, "b": 567.5, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 62, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 383.6, "r_y0": 567.5, "r_x1": 433.8, "r_y1": 567.5, "r_x2": 433.8, "r_y2": 563.2, "r_x3": 383.6, "r_y3": 563.2, "coord_origin": "TOPLEFT" }, "text": "Structure Tags sequence", "orig": "Structure Tags sequence", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 43, "label": "text", "bbox": { "l": 383.5, "t": 567.8, "r": 433.8, "b": 572.0, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 63, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 383.5, "r_y0": 572.0, "r_x1": 433.8, "r_y1": 572.0, "r_x2": 433.8, "r_y2": 567.8, "r_x3": 383.5, "r_y3": 567.8, "coord_origin": "TOPLEFT" }, "text": "provide full description of", "orig": "provide full description of", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 44, "label": "text", "bbox": { "l": 390.5, "t": 572.3, "r": 426.9, "b": 576.6, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 64, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 390.5, "r_y0": 576.6, "r_x1": 426.9, "r_y1": 576.6, "r_x2": 426.9, "r_y2": 572.3, "r_x3": 390.5, "r_y3": 572.3, "coord_origin": "TOPLEFT" }, "text": "the table structure", "orig": "the table structure", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 45, "label": "text", "bbox": { "l": 293.9, "t": 577.9, "r": 323.2, "b": 582.2, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 65, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 293.9, "r_y0": 582.2, "r_x1": 323.2, "r_y1": 582.2, "r_x2": 323.2, "r_y2": 577.9, "r_x3": 293.9, "r_y3": 577.9, "coord_origin": "TOPLEFT" }, "text": "Structure Tags", "orig": "Structure Tags", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 46, "label": "text", "bbox": { "l": 293.9, "t": 582.4, "r": 324.6, "b": 586.7, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 66, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 293.9, "r_y0": 586.7, "r_x1": 324.6, "r_y1": 586.7, "r_x2": 324.6, "r_y2": 582.4, "r_x3": 293.9, "r_y3": 582.4, "coord_origin": "TOPLEFT" }, "text": "in OTSL format", "orig": "in OTSL format", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 47, "label": "text", "bbox": { "l": 333.1, "t": 541.8, "r": 364.1, "b": 546.1, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 67, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 333.1, "r_y0": 546.1, "r_x1": 364.1, "r_y1": 546.1, "r_x2": 364.1, "r_y2": 541.8, "r_x3": 333.1, "r_y3": 541.8, "coord_origin": "TOPLEFT" }, "text": "BBoxes in sync", "orig": "BBoxes in sync", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 48, "label": "text", "bbox": { "l": 333.1, "t": 545.6, "r": 369.7, "b": 549.9, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 68, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 333.1, "r_y0": 549.9, "r_x1": 369.7, "r_y1": 549.9, "r_x2": 369.7, "r_y2": 545.6, "r_x3": 333.1, "r_y3": 545.6, "coord_origin": "TOPLEFT" }, "text": "with tag sequence", "orig": "with tag sequence", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 49, "label": "text", "bbox": { "l": 232.7, "t": 515.2, "r": 249.6, "b": 519.5, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 69, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 232.7, "r_y0": 519.5, "r_x1": 249.6, "r_y1": 519.5, "r_x2": 249.6, "r_y2": 515.2, "r_x3": 232.7, "r_y3": 515.2, "coord_origin": "TOPLEFT" }, "text": "Encoder", "orig": "Encoder", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 50, "label": "text", "bbox": { "l": 269.8, "t": 546.0, "r": 288.3, "b": 550.2, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 70, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 269.8, "r_y0": 550.2, "r_x1": 288.3, "r_y1": 550.2, "r_x2": 288.3, "r_y2": 546.0, "r_x3": 269.8, "r_y3": 546.0, "coord_origin": "TOPLEFT" }, "text": "Structure", "orig": "Structure", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 51, "label": "text", "bbox": { "l": 270.5, "t": 549.8, "r": 287.6, "b": 554.0, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 71, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 270.5, "r_y0": 554.0, "r_x1": 287.6, "r_y1": 554.0, "r_x2": 287.6, "r_y2": 549.8, "r_x3": 270.5, "r_y3": 549.8, "coord_origin": "TOPLEFT" }, "text": "Decoder", "orig": "Decoder", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 52, "label": "text", "bbox": { "l": 332.2, "t": 515.9, "r": 358.1, "b": 520.2, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 72, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 332.2, "r_y0": 520.2, "r_x1": 358.1, "r_y1": 520.2, "r_x2": 358.1, "r_y2": 515.9, "r_x3": 332.2, "r_y3": 515.9, "coord_origin": "TOPLEFT" }, "text": "[x1, y2, x2, y2]", "orig": "[x1, y2, x2, y2]", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 53, "label": "text", "bbox": { "l": 332.2, "t": 522.0, "r": 361.6, "b": 526.2, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 73, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 332.2, "r_y0": 526.2, "r_x1": 361.6, "r_y1": 526.2, "r_x2": 361.6, "r_y2": 522.0, "r_x3": 332.2, "r_y3": 522.0, "coord_origin": "TOPLEFT" }, "text": "[x1', y2', x2', y2']", "orig": "[x1', y2', x2', y2']", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 54, "label": "text", "bbox": { "l": 332.2, "t": 528.0, "r": 364.8, "b": 532.3, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 74, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 332.2, "r_y0": 532.3, "r_x1": 364.8, "r_y1": 532.3, "r_x2": 364.8, "r_y2": 528.0, "r_x3": 332.2, "r_y3": 528.0, "coord_origin": "TOPLEFT" }, "text": "[x1'', y2'', x2'', y2'']", "orig": "[x1'', y2'', x2'', y2'']", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 55, "label": "text", "bbox": { "l": 332.2, "t": 534.1, "r": 336.0, "b": 538.4, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 75, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 332.2, "r_y0": 538.4, "r_x1": 336.0, "r_y1": 538.4, "r_x2": 336.0, "r_y2": 534.1, "r_x3": 332.2, "r_y3": 534.1, "coord_origin": "TOPLEFT" }, "text": "...", "orig": "...", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 56, "label": "text", "bbox": { "l": 326.9, "t": 516.4, "r": 329.4, "b": 520.7, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 76, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 326.9, "r_y0": 520.7, "r_x1": 329.4, "r_y1": 520.7, "r_x2": 329.4, "r_y2": 516.4, "r_x3": 326.9, "r_y3": 516.4, "coord_origin": "TOPLEFT" }, "text": "1", "orig": "1", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 57, "label": "text", "bbox": { "l": 327.0, "t": 522.4, "r": 329.6, "b": 526.7, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 77, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 327.0, "r_y0": 526.7, "r_x1": 329.6, "r_y1": 526.7, "r_x2": 329.6, "r_y2": 522.4, "r_x3": 327.0, "r_y3": 522.4, "coord_origin": "TOPLEFT" }, "text": "2", "orig": "2", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 58, "label": "text", "bbox": { "l": 327.0, "t": 528.5, "r": 329.6, "b": 532.8, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 78, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 327.0, "r_y0": 532.8, "r_x1": 329.6, "r_y1": 532.8, "r_x2": 329.6, "r_y2": 528.5, "r_x3": 327.0, "r_y3": 528.5, "coord_origin": "TOPLEFT" }, "text": "3", "orig": "3", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 59, "label": "text", "bbox": { "l": 424.1, "t": 527.4, "r": 426.7, "b": 531.7, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 79, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 424.1, "r_y0": 531.7, "r_x1": 426.7, "r_y1": 531.7, "r_x2": 426.7, "r_y2": 527.4, "r_x3": 424.1, "r_y3": 527.4, "coord_origin": "TOPLEFT" }, "text": "3", "orig": "3", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 60, "label": "text", "bbox": { "l": 453.0, "t": 517.5, "r": 455.5, "b": 521.7, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 80, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 453.0, "r_y0": 521.7, "r_x1": 455.5, "r_y1": 521.7, "r_x2": 455.5, "r_y2": 517.5, "r_x3": 453.0, "r_y3": 517.5, "coord_origin": "TOPLEFT" }, "text": "2", "orig": "2", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 61, "label": "text", "bbox": { "l": 423.9, "t": 517.1, "r": 426.4, "b": 521.3, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 81, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 423.9, "r_y0": 521.3, "r_x1": 426.4, "r_y1": 521.3, "r_x2": 426.4, "r_y2": 517.1, "r_x3": 423.9, "r_y3": 517.1, "coord_origin": "TOPLEFT" }, "text": "1", "orig": "1", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 62, "label": "text", "bbox": { "l": 333.4, "t": 557.4, "r": 337.3, "b": 562.4, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 82, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 333.4, "r_y0": 562.4, "r_x1": 337.3, "r_y1": 562.4, "r_x2": 337.3, "r_y2": 557.4, "r_x3": 333.4, "r_y3": 557.4, "coord_origin": "TOPLEFT" }, "text": "C", "orig": "C", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 63, "label": "text", "bbox": { "l": 340.4, "t": 557.3, "r": 344.2, "b": 562.3, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 83, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 340.4, "r_y0": 562.3, "r_x1": 344.2, "r_y1": 562.3, "r_x2": 344.2, "r_y2": 557.3, "r_x3": 340.4, "r_y3": 557.3, "coord_origin": "TOPLEFT" }, "text": "C", "orig": "C", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 64, "label": "text", "bbox": { "l": 340.3, "t": 563.9, "r": 344.2, "b": 568.9, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 84, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 340.3, "r_y0": 568.9, "r_x1": 344.2, "r_y1": 568.9, "r_x2": 344.2, "r_y2": 563.9, "r_x3": 340.3, "r_y3": 563.9, "coord_origin": "TOPLEFT" }, "text": "C", "orig": "C", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 65, "label": "text", "bbox": { "l": 346.8, "t": 563.9, "r": 350.6, "b": 568.9, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 85, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 346.8, "r_y0": 568.9, "r_x1": 350.6, "r_y1": 568.9, "r_x2": 350.6, "r_y2": 563.9, "r_x3": 346.8, "r_y3": 563.9, "coord_origin": "TOPLEFT" }, "text": "C", "orig": "C", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 66, "label": "text", "bbox": { "l": 333.6, "t": 563.8, "r": 337.4, "b": 568.8, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 86, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 333.6, "r_y0": 568.8, "r_x1": 337.4, "r_y1": 568.8, "r_x2": 337.4, "r_y2": 563.8, "r_x3": 333.6, "r_y3": 563.8, "coord_origin": "TOPLEFT" }, "text": "C", "orig": "C", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 67, "label": "text", "bbox": { "l": 340.4, "t": 570.4, "r": 344.2, "b": 575.4, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 87, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 340.4, "r_y0": 575.4, "r_x1": 344.2, "r_y1": 575.4, "r_x2": 344.2, "r_y2": 570.4, "r_x3": 340.4, "r_y3": 570.4, "coord_origin": "TOPLEFT" }, "text": "C", "orig": "C", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 68, "label": "text", "bbox": { "l": 346.9, "t": 570.4, "r": 350.7, "b": 575.4, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 88, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 346.9, "r_y0": 575.4, "r_x1": 350.7, "r_y1": 575.4, "r_x2": 350.7, "r_y2": 570.4, "r_x3": 346.9, "r_y3": 570.4, "coord_origin": "TOPLEFT" }, "text": "C", "orig": "C", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 69, "label": "text", "bbox": { "l": 333.7, "t": 570.4, "r": 337.5, "b": 575.4, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 89, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 333.7, "r_y0": 575.4, "r_x1": 337.5, "r_y1": 575.4, "r_x2": 337.5, "r_y2": 570.4, "r_x3": 333.7, "r_y3": 570.4, "coord_origin": "TOPLEFT" }, "text": "C", "orig": "C", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 70, "label": "text", "bbox": { "l": 340.4, "t": 577.0, "r": 344.2, "b": 582.0, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 90, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 340.4, "r_y0": 582.0, "r_x1": 344.2, "r_y1": 582.0, "r_x2": 344.2, "r_y2": 577.0, "r_x3": 340.4, "r_y3": 577.0, "coord_origin": "TOPLEFT" }, "text": "C", "orig": "C", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 71, "label": "text", "bbox": { "l": 346.9, "t": 577.0, "r": 350.7, "b": 582.0, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 91, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 346.9, "r_y0": 582.0, "r_x1": 350.7, "r_y1": 582.0, "r_x2": 350.7, "r_y2": 577.0, "r_x3": 346.9, "r_y3": 577.0, "coord_origin": "TOPLEFT" }, "text": "C", "orig": "C", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 72, "label": "text", "bbox": { "l": 333.7, "t": 577.0, "r": 337.5, "b": 582.0, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 92, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 333.7, "r_y0": 582.0, "r_x1": 337.5, "r_y1": 582.0, "r_x2": 337.5, "r_y2": 577.0, "r_x3": 333.7, "r_y3": 577.0, "coord_origin": "TOPLEFT" }, "text": "C", "orig": "C", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 73, "label": "text", "bbox": { "l": 340.3, "t": 583.4, "r": 344.1, "b": 588.4, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 93, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 340.3, "r_y0": 588.4, "r_x1": 344.1, "r_y1": 588.4, "r_x2": 344.1, "r_y2": 583.4, "r_x3": 340.3, "r_y3": 583.4, "coord_origin": "TOPLEFT" }, "text": "C", "orig": "C", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 74, "label": "text", "bbox": { "l": 346.8, "t": 583.4, "r": 350.6, "b": 588.4, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 94, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 346.8, "r_y0": 588.4, "r_x1": 350.6, "r_y1": 588.4, "r_x2": 350.6, "r_y2": 583.4, "r_x3": 346.8, "r_y3": 583.4, "coord_origin": "TOPLEFT" }, "text": "C", "orig": "C", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 75, "label": "text", "bbox": { "l": 333.6, "t": 583.4, "r": 337.4, "b": 588.3, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 95, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 333.6, "r_y0": 588.3, "r_x1": 337.4, "r_y1": 588.3, "r_x2": 337.4, "r_y2": 583.4, "r_x3": 333.6, "r_y3": 583.4, "coord_origin": "TOPLEFT" }, "text": "C", "orig": "C", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 76, "label": "text", "bbox": { "l": 353.0, "t": 556.9, "r": 359.8, "b": 561.9, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 96, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 353.0, "r_y0": 561.9, "r_x1": 359.8, "r_y1": 561.9, "r_x2": 359.8, "r_y2": 556.9, "r_x3": 353.0, "r_y3": 556.9, "coord_origin": "TOPLEFT" }, "text": "NL", "orig": "NL", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 77, "label": "text", "bbox": { "l": 353.2, "t": 563.6, "r": 360.0, "b": 568.6, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 97, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 353.2, "r_y0": 568.6, "r_x1": 360.0, "r_y1": 568.6, "r_x2": 360.0, "r_y2": 563.6, "r_x3": 353.2, "r_y3": 563.6, "coord_origin": "TOPLEFT" }, "text": "NL", "orig": "NL", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 78, "label": "text", "bbox": { "l": 353.2, "t": 570.2, "r": 360.0, "b": 575.2, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 98, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 353.2, "r_y0": 575.2, "r_x1": 360.0, "r_y1": 575.2, "r_x2": 360.0, "r_y2": 570.2, "r_x3": 353.2, "r_y3": 570.2, "coord_origin": "TOPLEFT" }, "text": "NL", "orig": "NL", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 79, "label": "text", "bbox": { "l": 353.2, "t": 576.8, "r": 360.0, "b": 581.8, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 99, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 353.2, "r_y0": 581.8, "r_x1": 360.0, "r_y1": 581.8, "r_x2": 360.0, "r_y2": 576.8, "r_x3": 353.2, "r_y3": 576.8, "coord_origin": "TOPLEFT" }, "text": "NL", "orig": "NL", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 80, "label": "text", "bbox": { "l": 353.3, "t": 583.4, "r": 360.1, "b": 588.4, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 100, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 353.3, "r_y0": 588.4, "r_x1": 360.1, "r_y1": 588.4, "r_x2": 360.1, "r_y2": 583.4, "r_x3": 353.3, "r_y3": 583.4, "coord_origin": "TOPLEFT" }, "text": "NL", "orig": "NL", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 81, "label": "text", "bbox": { "l": 347.4, "t": 557.1, "r": 350.3, "b": 562.1, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 101, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 347.4, "r_y0": 562.1, "r_x1": 350.3, "r_y1": 562.1, "r_x2": 350.3, "r_y2": 557.1, "r_x3": 347.4, "r_y3": 557.1, "coord_origin": "TOPLEFT" }, "text": "L", "orig": "L", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 82, "label": "text", "bbox": { "l": 331.1, "t": 564.3, "r": 333.7, "b": 568.6, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 102, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 331.1, "r_y0": 568.6, "r_x1": 333.7, "r_y1": 568.6, "r_x2": 333.7, "r_y2": 564.3, "r_x3": 331.1, "r_y3": 564.3, "coord_origin": "TOPLEFT" }, "text": "3", "orig": "3", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 83, "label": "text", "bbox": { "l": 340.8, "t": 554.6, "r": 343.3, "b": 558.9, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 103, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 340.8, "r_y0": 558.9, "r_x1": 343.3, "r_y1": 558.9, "r_x2": 343.3, "r_y2": 554.6, "r_x3": 340.8, "r_y3": 554.6, "coord_origin": "TOPLEFT" }, "text": "2", "orig": "2", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 84, "label": "text", "bbox": { "l": 331.0, "t": 554.8, "r": 333.5, "b": 559.1, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 104, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 331.0, "r_y0": 559.1, "r_x1": 333.5, "r_y1": 559.1, "r_x2": 333.5, "r_y2": 554.8, "r_x3": 331.0, "r_y3": 554.8, "coord_origin": "TOPLEFT" }, "text": "1", "orig": "1", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] } ] }, "text": "", "annotations": [], "provenance": null, "predicted_class": null, "confidence": null }, { "label": "text", "id": 4, "page_no": 7, "cluster": { "id": 4, "label": "text", "bbox": { "l": 134.8, "t": 620.2, "r": 480.6, "b": 664.9, "coord_origin": "TOPLEFT" }, "confidence": 0.95, "cells": [ { "index": 105, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 149.7, "r_y0": 629.0, "r_x1": 480.6, "r_y1": 629.0, "r_x2": 480.6, "r_y2": 620.2, "r_x3": 149.7, "r_y3": 620.2, "coord_origin": "TOPLEFT" }, "text": "We rely on standard metrics such as Tree Edit Distance score (TEDs) for", "orig": "We rely on standard metrics such as Tree Edit Distance score (TEDs) for", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 106, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 134.8, "r_y0": 640.9, "r_x1": 480.6, "r_y1": 640.9, "r_x2": 480.6, "r_y2": 632.1, "r_x3": 134.8, "r_y3": 632.1, "coord_origin": "TOPLEFT" }, "text": "table structure prediction, and Mean Average Precision (mAP) with 0.75 Inter-", "orig": "table structure prediction, and Mean Average Precision (mAP) with 0.75 Inter-", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 107, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 134.8, "r_y0": 652.9, "r_x1": 480.6, "r_y1": 652.9, "r_x2": 480.6, "r_y2": 644.1, "r_x3": 134.8, "r_y3": 644.1, "coord_origin": "TOPLEFT" }, "text": "section Over Union (IOU) threshold for the bounding-box predictions of table", "orig": "section Over Union (IOU) threshold for the bounding-box predictions of table", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 108, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 134.8, "r_y0": 664.9, "r_x1": 480.6, "r_y1": 664.9, "r_x2": 480.6, "r_y2": 656.1, "r_x3": 134.8, "r_y3": 656.1, "coord_origin": "TOPLEFT" }, "text": "cells. The predicted OTSL structures were converted back to HTML format in", "orig": "cells. The predicted OTSL structures were converted back to HTML format in", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, "text": "We rely on standard metrics such as Tree Edit Distance score (TEDs) for table structure prediction, and Mean Average Precision (mAP) with 0.75 Intersection Over Union (IOU) threshold for the bounding-box predictions of table cells. The predicted OTSL structures were converted back to HTML format in" } ], "headers": [ { "label": "page_header", "id": 9, "page_no": 7, "cluster": { "id": 9, "label": "page_header", "bbox": { "l": 134.8, "t": 93.8, "r": 139.4, "b": 101.8, "coord_origin": "TOPLEFT" }, "confidence": 0.83, "cells": [ { "index": 0, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 134.8, "r_y0": 101.8, "r_x1": 139.4, "r_y1": 101.8, "r_x2": 139.4, "r_y2": 93.8, "r_x3": 134.8, "r_y3": 93.8, "coord_origin": "TOPLEFT" }, "text": "8", "orig": "8", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, "text": "8" }, { "label": "page_header", "id": 8, "page_no": 7, "cluster": { "id": 8, "label": "page_header", "bbox": { "l": 167.8, "t": 93.8, "r": 231.7, "b": 101.8, "coord_origin": "TOPLEFT" }, "confidence": 0.86, "cells": [ { "index": 1, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 167.8, "r_y0": 101.8, "r_x1": 178.1, "r_y1": 101.8, "r_x2": 178.1, "r_y2": 93.8, "r_x3": 167.8, "r_y3": 93.8, "coord_origin": "TOPLEFT" }, "text": "M.", "orig": "M.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 2, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 182.4, "r_y0": 101.8, "r_x1": 231.7, "r_y1": 101.8, "r_x2": 231.7, "r_y2": 93.8, "r_x3": 182.4, "r_y3": 93.8, "coord_origin": "TOPLEFT" }, "text": "Lysak, et al.", "orig": "Lysak, et al.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, "text": "M. Lysak, et al." } ] } }, { "page_no": 8, "size": { "width": 612.0, "height": 792.0 }, "parsed_page": { "dimension": { "angle": 0.0, "rect": { "r_x0": 0.0, "r_y0": 0.0, "r_x1": 612.0, "r_y1": 0.0, "r_x2": 612.0, "r_y2": 792.0, "r_x3": 0.0, "r_y3": 792.0, "coord_origin": "BOTTOMLEFT" }, "boundary_type": "crop_box", "art_bbox": { "l": 0.0, "t": 792.0, "r": 612.0, "b": 0.0, "coord_origin": "BOTTOMLEFT" }, "bleed_bbox": { "l": 0.0, "t": 792.0, "r": 612.0, "b": 0.0, "coord_origin": "BOTTOMLEFT" }, "crop_bbox": { "l": 0.0, "t": 792.0, "r": 612.0, "b": 0.0, "coord_origin": "BOTTOMLEFT" }, "media_bbox": { "l": 0.0, "t": 792.0, "r": 612.0, "b": 0.0, "coord_origin": "BOTTOMLEFT" }, "trim_bbox": { "l": 0.0, "t": 792.0, "r": 612.0, "b": 0.0, "coord_origin": "BOTTOMLEFT" } }, "bitmap_resources": [], "char_cells": [], "word_cells": [], "textline_cells": [ { "index": 0, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 194.5, "r_y0": 101.8, "r_x1": 447.5, "r_y1": 101.8, "r_x2": 447.5, "r_y2": 93.8, "r_x3": 194.5, "r_y3": 93.8, "coord_origin": "TOPLEFT" }, "text": "Optimized Table Tokenization for Table Structure Recognition", "orig": "Optimized Table Tokenization for Table Structure Recognition", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 1, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 476.0, "r_y0": 101.8, "r_x1": 480.6, "r_y1": 101.8, "r_x2": 480.6, "r_y2": 93.8, "r_x3": 476.0, "r_y3": 93.8, "coord_origin": "TOPLEFT" }, "text": "9", "orig": "9", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 2, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 134.8, "r_y0": 127.7, "r_x1": 480.6, "r_y1": 127.7, "r_x2": 480.6, "r_y2": 118.9, "r_x3": 134.8, "r_y3": 118.9, "coord_origin": "TOPLEFT" }, "text": "order to compute the TED score. Inference timing results for all experiments", "orig": "order to compute the TED score. Inference timing results for all experiments", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 3, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 134.8, "r_y0": 139.7, "r_x1": 480.6, "r_y1": 139.7, "r_x2": 480.6, "r_y2": 130.9, "r_x3": 134.8, "r_y3": 130.9, "coord_origin": "TOPLEFT" }, "text": "were obtained from the same machine on a single core with AMD EPYC 7763", "orig": "were obtained from the same machine on a single core with AMD EPYC 7763", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 4, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 134.8, "r_y0": 151.6, "r_x1": 210.8, "r_y1": 151.6, "r_x2": 210.8, "r_y2": 142.8, "r_x3": 134.8, "r_y3": 142.8, "coord_origin": "TOPLEFT" }, "text": "CPU @2.45 GHz.", "orig": "CPU @2.45 GHz.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 5, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 134.8, "r_y0": 178.0, "r_x1": 149.4, "r_y1": 178.0, "r_x2": 149.4, "r_y2": 169.2, "r_x3": 134.8, "r_y3": 169.2, "coord_origin": "TOPLEFT" }, "text": "5.1", "orig": "5.1", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 6, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 160.9, "r_y0": 178.0, "r_x1": 318.4, "r_y1": 178.0, "r_x2": 318.4, "r_y2": 169.2, "r_x3": 160.9, "r_y3": 169.2, "coord_origin": "TOPLEFT" }, "text": "Hyper Parameter Optimization", "orig": "Hyper Parameter Optimization", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 7, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 134.8, "r_y0": 194.4, "r_x1": 480.6, "r_y1": 194.4, "r_x2": 480.6, "r_y2": 185.6, "r_x3": 134.8, "r_y3": 185.6, "coord_origin": "TOPLEFT" }, "text": "We have chosen the PubTabNet data set to perform HPO, since it includes a", "orig": "We have chosen the PubTabNet data set to perform HPO, since it includes a", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 8, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 134.8, "r_y0": 206.3, "r_x1": 480.6, "r_y1": 206.3, "r_x2": 480.6, "r_y2": 197.5, "r_x3": 134.8, "r_y3": 197.5, "coord_origin": "TOPLEFT" }, "text": "highly diverse set of tables. Also we report TED scores separately for simple and", "orig": "highly diverse set of tables. Also we report TED scores separately for simple and", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 9, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 134.8, "r_y0": 218.3, "r_x1": 480.6, "r_y1": 218.3, "r_x2": 480.6, "r_y2": 209.5, "r_x3": 134.8, "r_y3": 209.5, "coord_origin": "TOPLEFT" }, "text": "complex tables (tables with cell spans). Results are presented in Table. 1. It is", "orig": "complex tables (tables with cell spans). Results are presented in Table. 1. It is", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 10, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 134.8, "r_y0": 230.2, "r_x1": 480.6, "r_y1": 230.2, "r_x2": 480.6, "r_y2": 221.5, "r_x3": 134.8, "r_y3": 221.5, "coord_origin": "TOPLEFT" }, "text": "evident that with OTSL, our model achieves the same TED score and slightly", "orig": "evident that with OTSL, our model achieves the same TED score and slightly", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 11, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 134.8, "r_y0": 242.2, "r_x1": 440.9, "r_y1": 242.2, "r_x2": 440.9, "r_y2": 233.4, "r_x3": 134.8, "r_y3": 233.4, "coord_origin": "TOPLEFT" }, "text": "better mAP scores in comparison to HTML. However OTSL yields a", "orig": "better mAP scores in comparison to HTML. However OTSL yields a", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 12, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 444.9, "r_y0": 242.2, "r_x1": 480.6, "r_y1": 242.2, "r_x2": 480.6, "r_y2": 233.4, "r_x3": 444.9, "r_y3": 233.4, "coord_origin": "TOPLEFT" }, "text": "2x speed", "orig": "2x speed", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 13, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 134.8, "r_y0": 254.2, "r_x1": 145.2, "r_y1": 254.2, "r_x2": 145.2, "r_y2": 245.4, "r_x3": 134.8, "r_y3": 245.4, "coord_origin": "TOPLEFT" }, "text": "up", "orig": "up", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 14, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 149.1, "r_y0": 254.2, "r_x1": 311.2, "r_y1": 254.2, "r_x2": 311.2, "r_y2": 245.4, "r_x3": 149.1, "r_y3": 245.4, "coord_origin": "TOPLEFT" }, "text": "in the inference runtime over HTML.", "orig": "in the inference runtime over HTML.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 15, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 134.8, "r_y0": 283.0, "r_x1": 160.1, "r_y1": 283.0, "r_x2": 160.1, "r_y2": 275.1, "r_x3": 134.8, "r_y3": 275.1, "coord_origin": "TOPLEFT" }, "text": "Table", "orig": "Table", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 16, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 167.3, "r_y0": 283.0, "r_x1": 175.6, "r_y1": 283.0, "r_x2": 175.6, "r_y2": 275.1, "r_x3": 167.3, "r_y3": 275.1, "coord_origin": "TOPLEFT" }, "text": "1.", "orig": "1.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 17, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 188.1, "r_y0": 283.2, "r_x1": 480.6, "r_y1": 283.2, "r_x2": 480.6, "r_y2": 275.1, "r_x3": 188.1, "r_y3": 275.1, "coord_origin": "TOPLEFT" }, "text": "HPO performed in OTSL and HTML representation on the same", "orig": "HPO performed in OTSL and HTML representation on the same", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 18, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 134.8, "r_y0": 294.2, "r_x1": 480.6, "r_y1": 294.2, "r_x2": 480.6, "r_y2": 286.1, "r_x3": 134.8, "r_y3": 286.1, "coord_origin": "TOPLEFT" }, "text": "transformer-based TableFormer [9] architecture, trained only on PubTabNet [22]. Ef-", "orig": "transformer-based TableFormer [9] architecture, trained only on PubTabNet [22]. Ef-", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 19, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 134.8, "r_y0": 305.1, "r_x1": 480.6, "r_y1": 305.1, "r_x2": 480.6, "r_y2": 297.1, "r_x3": 134.8, "r_y3": 297.1, "coord_origin": "TOPLEFT" }, "text": "fects of reducing the # of layers in encoder and decoder stages of the model show that", "orig": "fects of reducing the # of layers in encoder and decoder stages of the model show that", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 20, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 134.8, "r_y0": 316.1, "r_x1": 480.6, "r_y1": 316.1, "r_x2": 480.6, "r_y2": 308.0, "r_x3": 134.8, "r_y3": 308.0, "coord_origin": "TOPLEFT" }, "text": "smaller models trained on OTSL perform better, especially in recognizing complex", "orig": "smaller models trained on OTSL perform better, especially in recognizing complex", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 21, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 134.8, "r_y0": 327.0, "r_x1": 480.6, "r_y1": 327.0, "r_x2": 480.6, "r_y2": 319.0, "r_x3": 134.8, "r_y3": 319.0, "coord_origin": "TOPLEFT" }, "text": "table structures, and maintain a much higher mAP score than the HTML counterpart.", "orig": "table structures, and maintain a much higher mAP score than the HTML counterpart.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 22, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 160.4, "r_y0": 349.8, "r_x1": 168.0, "r_y1": 349.8, "r_x2": 168.0, "r_y2": 341.7, "r_x3": 160.4, "r_y3": 341.7, "coord_origin": "TOPLEFT" }, "text": "#", "orig": "#", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 23, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 144.6, "r_y0": 362.8, "r_x1": 183.8, "r_y1": 362.8, "r_x2": 183.8, "r_y2": 354.7, "r_x3": 144.6, "r_y3": 354.7, "coord_origin": "TOPLEFT" }, "text": "enc-layers", "orig": "enc-layers", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 24, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 208.0, "r_y0": 349.8, "r_x1": 215.7, "r_y1": 349.8, "r_x2": 215.7, "r_y2": 341.7, "r_x3": 208.0, "r_y3": 341.7, "coord_origin": "TOPLEFT" }, "text": "#", "orig": "#", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 25, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 192.2, "r_y0": 362.8, "r_x1": 231.4, "r_y1": 362.8, "r_x2": 231.4, "r_y2": 354.7, "r_x3": 192.2, "r_y3": 354.7, "coord_origin": "TOPLEFT" }, "text": "dec-layers", "orig": "dec-layers", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 26, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 239.8, "r_y0": 355.3, "r_x1": 278.3, "r_y1": 355.3, "r_x2": 278.3, "r_y2": 347.2, "r_x3": 239.8, "r_y3": 347.2, "coord_origin": "TOPLEFT" }, "text": "Language", "orig": "Language", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 27, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 324.7, "r_y0": 349.8, "r_x1": 348.3, "r_y1": 349.8, "r_x2": 348.3, "r_y2": 341.7, "r_x3": 324.7, "r_y3": 341.7, "coord_origin": "TOPLEFT" }, "text": "TEDs", "orig": "TEDs", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 28, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 396.3, "r_y0": 349.8, "r_x1": 417.1, "r_y1": 349.8, "r_x2": 417.1, "r_y2": 341.7, "r_x3": 396.3, "r_y3": 341.7, "coord_origin": "TOPLEFT" }, "text": "mAP", "orig": "mAP", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 29, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 394.9, "r_y0": 360.8, "r_x1": 418.5, "r_y1": 360.8, "r_x2": 418.5, "r_y2": 352.7, "r_x3": 394.9, "r_y3": 352.7, "coord_origin": "TOPLEFT" }, "text": "(0.75)", "orig": "(0.75)", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 30, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 430.8, "r_y0": 349.8, "r_x1": 467.1, "r_y1": 349.8, "r_x2": 467.1, "r_y2": 341.7, "r_x3": 430.8, "r_y3": 341.7, "coord_origin": "TOPLEFT" }, "text": "Inference", "orig": "Inference", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 31, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 427.1, "r_y0": 360.8, "r_x1": 470.8, "r_y1": 360.8, "r_x2": 470.8, "r_y2": 352.7, "r_x3": 427.1, "r_y3": 352.7, "coord_origin": "TOPLEFT" }, "text": "time (secs)", "orig": "time (secs)", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 32, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 286.7, "r_y0": 362.8, "r_x1": 312.3, "r_y1": 362.8, "r_x2": 312.3, "r_y2": 354.7, "r_x3": 286.7, "r_y3": 354.7, "coord_origin": "TOPLEFT" }, "text": "simple", "orig": "simple", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 33, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 320.7, "r_y0": 362.8, "r_x1": 353.7, "r_y1": 362.8, "r_x2": 353.7, "r_y2": 354.7, "r_x3": 320.7, "r_y3": 354.7, "coord_origin": "TOPLEFT" }, "text": "complex", "orig": "complex", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 34, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 369.3, "r_y0": 362.8, "r_x1": 379.0, "r_y1": 362.8, "r_x2": 379.0, "r_y2": 354.7, "r_x3": 369.3, "r_y3": 354.7, "coord_origin": "TOPLEFT" }, "text": "all", "orig": "all", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 35, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 161.9, "r_y0": 381.6, "r_x1": 166.5, "r_y1": 381.6, "r_x2": 166.5, "r_y2": 373.5, "r_x3": 161.9, "r_y3": 373.5, "coord_origin": "TOPLEFT" }, "text": "6", "orig": "6", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 36, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 209.5, "r_y0": 381.6, "r_x1": 214.1, "r_y1": 381.6, "r_x2": 214.1, "r_y2": 373.5, "r_x3": 209.5, "r_y3": 373.5, "coord_origin": "TOPLEFT" }, "text": "6", "orig": "6", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 37, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 246.7, "r_y0": 376.1, "r_x1": 271.4, "r_y1": 376.1, "r_x2": 271.4, "r_y2": 368.0, "r_x3": 246.7, "r_y3": 368.0, "coord_origin": "TOPLEFT" }, "text": "OTSL", "orig": "OTSL", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 38, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 289.0, "r_y0": 376.1, "r_x1": 310.0, "r_y1": 376.1, "r_x2": 310.0, "r_y2": 368.0, "r_x3": 289.0, "r_y3": 368.0, "coord_origin": "TOPLEFT" }, "text": "0.965", "orig": "0.965", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 39, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 326.7, "r_y0": 376.1, "r_x1": 347.7, "r_y1": 376.1, "r_x2": 347.7, "r_y2": 368.0, "r_x3": 326.7, "r_y3": 368.0, "coord_origin": "TOPLEFT" }, "text": "0.934", "orig": "0.934", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 40, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 363.7, "r_y0": 376.1, "r_x1": 384.7, "r_y1": 376.1, "r_x2": 384.7, "r_y2": 368.0, "r_x3": 363.7, "r_y3": 368.0, "coord_origin": "TOPLEFT" }, "text": "0.955", "orig": "0.955", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 41, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 397.3, "r_y0": 375.9, "r_x1": 416.1, "r_y1": 375.9, "r_x2": 416.1, "r_y2": 368.0, "r_x3": 397.3, "r_y3": 368.0, "coord_origin": "TOPLEFT" }, "text": "0.88", "orig": "0.88", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 42, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 439.5, "r_y0": 375.9, "r_x1": 458.4, "r_y1": 375.9, "r_x2": 458.4, "r_y2": 368.0, "r_x3": 439.5, "r_y3": 368.0, "coord_origin": "TOPLEFT" }, "text": "2.73", "orig": "2.73", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 43, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 245.2, "r_y0": 389.1, "r_x1": 272.9, "r_y1": 389.1, "r_x2": 272.9, "r_y2": 381.0, "r_x3": 245.2, "r_y3": 381.0, "coord_origin": "TOPLEFT" }, "text": "HTML", "orig": "HTML", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 44, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 289.0, "r_y0": 389.1, "r_x1": 310.0, "r_y1": 389.1, "r_x2": 310.0, "r_y2": 381.0, "r_x3": 289.0, "r_y3": 381.0, "coord_origin": "TOPLEFT" }, "text": "0.969", "orig": "0.969", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 45, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 326.7, "r_y0": 389.1, "r_x1": 347.7, "r_y1": 389.1, "r_x2": 347.7, "r_y2": 381.0, "r_x3": 326.7, "r_y3": 381.0, "coord_origin": "TOPLEFT" }, "text": "0.927", "orig": "0.927", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 46, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 363.7, "r_y0": 389.1, "r_x1": 384.7, "r_y1": 389.1, "r_x2": 384.7, "r_y2": 381.0, "r_x3": 363.7, "r_y3": 381.0, "coord_origin": "TOPLEFT" }, "text": "0.955", "orig": "0.955", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 47, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 396.2, "r_y0": 389.1, "r_x1": 417.2, "r_y1": 389.1, "r_x2": 417.2, "r_y2": 381.0, "r_x3": 396.2, "r_y3": 381.0, "coord_origin": "TOPLEFT" }, "text": "0.857", "orig": "0.857", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 48, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 440.8, "r_y0": 389.1, "r_x1": 457.1, "r_y1": 389.1, "r_x2": 457.1, "r_y2": 381.0, "r_x3": 440.8, "r_y3": 381.0, "coord_origin": "TOPLEFT" }, "text": "5.39", "orig": "5.39", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 49, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 161.9, "r_y0": 407.9, "r_x1": 166.5, "r_y1": 407.9, "r_x2": 166.5, "r_y2": 399.8, "r_x3": 161.9, "r_y3": 399.8, "coord_origin": "TOPLEFT" }, "text": "4", "orig": "4", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 50, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 209.5, "r_y0": 407.9, "r_x1": 214.1, "r_y1": 407.9, "r_x2": 214.1, "r_y2": 399.8, "r_x3": 209.5, "r_y3": 399.8, "coord_origin": "TOPLEFT" }, "text": "4", "orig": "4", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 51, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 246.7, "r_y0": 402.4, "r_x1": 271.4, "r_y1": 402.4, "r_x2": 271.4, "r_y2": 394.3, "r_x3": 246.7, "r_y3": 394.3, "coord_origin": "TOPLEFT" }, "text": "OTSL", "orig": "OTSL", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 52, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 289.0, "r_y0": 402.4, "r_x1": 310.0, "r_y1": 402.4, "r_x2": 310.0, "r_y2": 394.3, "r_x3": 289.0, "r_y3": 394.3, "coord_origin": "TOPLEFT" }, "text": "0.938", "orig": "0.938", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 53, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 326.7, "r_y0": 402.4, "r_x1": 347.7, "r_y1": 402.4, "r_x2": 347.7, "r_y2": 394.3, "r_x3": 326.7, "r_y3": 394.3, "coord_origin": "TOPLEFT" }, "text": "0.904", "orig": "0.904", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 54, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 363.7, "r_y0": 402.4, "r_x1": 384.7, "r_y1": 402.4, "r_x2": 384.7, "r_y2": 394.3, "r_x3": 363.7, "r_y3": 394.3, "coord_origin": "TOPLEFT" }, "text": "0.927", "orig": "0.927", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 55, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 394.6, "r_y0": 402.2, "r_x1": 418.8, "r_y1": 402.2, "r_x2": 418.8, "r_y2": 394.3, "r_x3": 394.6, "r_y3": 394.3, "coord_origin": "TOPLEFT" }, "text": "0.853", "orig": "0.853", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 56, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 439.5, "r_y0": 402.2, "r_x1": 458.4, "r_y1": 402.2, "r_x2": 458.4, "r_y2": 394.3, "r_x3": 439.5, "r_y3": 394.3, "coord_origin": "TOPLEFT" }, "text": "1.97", "orig": "1.97", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 57, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 245.2, "r_y0": 415.4, "r_x1": 272.9, "r_y1": 415.4, "r_x2": 272.9, "r_y2": 407.3, "r_x3": 245.2, "r_y3": 407.3, "coord_origin": "TOPLEFT" }, "text": "HTML", "orig": "HTML", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 58, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 289.0, "r_y0": 415.4, "r_x1": 310.0, "r_y1": 415.4, "r_x2": 310.0, "r_y2": 407.3, "r_x3": 289.0, "r_y3": 407.3, "coord_origin": "TOPLEFT" }, "text": "0.952", "orig": "0.952", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 59, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 326.7, "r_y0": 415.4, "r_x1": 347.7, "r_y1": 415.4, "r_x2": 347.7, "r_y2": 407.3, "r_x3": 326.7, "r_y3": 407.3, "coord_origin": "TOPLEFT" }, "text": "0.909", "orig": "0.909", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 60, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 362.1, "r_y0": 415.2, "r_x1": 386.2, "r_y1": 415.2, "r_x2": 386.2, "r_y2": 407.2, "r_x3": 362.1, "r_y3": 407.2, "coord_origin": "TOPLEFT" }, "text": "0.938", "orig": "0.938", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 61, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 396.2, "r_y0": 415.4, "r_x1": 417.2, "r_y1": 415.4, "r_x2": 417.2, "r_y2": 407.3, "r_x3": 396.2, "r_y3": 407.3, "coord_origin": "TOPLEFT" }, "text": "0.843", "orig": "0.843", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 62, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 440.8, "r_y0": 415.4, "r_x1": 457.1, "r_y1": 415.4, "r_x2": 457.1, "r_y2": 407.3, "r_x3": 440.8, "r_y3": 407.3, "coord_origin": "TOPLEFT" }, "text": "3.77", "orig": "3.77", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 63, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 161.9, "r_y0": 434.2, "r_x1": 166.5, "r_y1": 434.2, "r_x2": 166.5, "r_y2": 426.1, "r_x3": 161.9, "r_y3": 426.1, "coord_origin": "TOPLEFT" }, "text": "2", "orig": "2", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 64, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 209.5, "r_y0": 434.2, "r_x1": 214.1, "r_y1": 434.2, "r_x2": 214.1, "r_y2": 426.1, "r_x3": 209.5, "r_y3": 426.1, "coord_origin": "TOPLEFT" }, "text": "4", "orig": "4", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 65, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 246.7, "r_y0": 428.7, "r_x1": 271.4, "r_y1": 428.7, "r_x2": 271.4, "r_y2": 420.6, "r_x3": 246.7, "r_y3": 420.6, "coord_origin": "TOPLEFT" }, "text": "OTSL", "orig": "OTSL", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 66, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 289.0, "r_y0": 428.7, "r_x1": 310.0, "r_y1": 428.7, "r_x2": 310.0, "r_y2": 420.6, "r_x3": 289.0, "r_y3": 420.6, "coord_origin": "TOPLEFT" }, "text": "0.923", "orig": "0.923", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 67, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 326.7, "r_y0": 428.7, "r_x1": 347.7, "r_y1": 428.7, "r_x2": 347.7, "r_y2": 420.6, "r_x3": 326.7, "r_y3": 420.6, "coord_origin": "TOPLEFT" }, "text": "0.897", "orig": "0.897", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 68, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 363.7, "r_y0": 428.7, "r_x1": 384.7, "r_y1": 428.7, "r_x2": 384.7, "r_y2": 420.6, "r_x3": 363.7, "r_y3": 420.6, "coord_origin": "TOPLEFT" }, "text": "0.915", "orig": "0.915", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 69, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 394.6, "r_y0": 428.5, "r_x1": 418.8, "r_y1": 428.5, "r_x2": 418.8, "r_y2": 420.6, "r_x3": 394.6, "r_y3": 420.6, "coord_origin": "TOPLEFT" }, "text": "0.859", "orig": "0.859", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 70, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 439.5, "r_y0": 428.5, "r_x1": 458.4, "r_y1": 428.5, "r_x2": 458.4, "r_y2": 420.6, "r_x3": 439.5, "r_y3": 420.6, "coord_origin": "TOPLEFT" }, "text": "1.91", "orig": "1.91", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 71, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 245.2, "r_y0": 441.7, "r_x1": 272.9, "r_y1": 441.7, "r_x2": 272.9, "r_y2": 433.6, "r_x3": 245.2, "r_y3": 433.6, "coord_origin": "TOPLEFT" }, "text": "HTML", "orig": "HTML", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 72, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 289.0, "r_y0": 441.7, "r_x1": 310.0, "r_y1": 441.7, "r_x2": 310.0, "r_y2": 433.6, "r_x3": 289.0, "r_y3": 433.6, "coord_origin": "TOPLEFT" }, "text": "0.945", "orig": "0.945", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 73, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 326.7, "r_y0": 441.7, "r_x1": 347.7, "r_y1": 441.7, "r_x2": 347.7, "r_y2": 433.6, "r_x3": 326.7, "r_y3": 433.6, "coord_origin": "TOPLEFT" }, "text": "0.901", "orig": "0.901", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 74, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 362.1, "r_y0": 441.5, "r_x1": 386.2, "r_y1": 441.5, "r_x2": 386.2, "r_y2": 433.5, "r_x3": 362.1, "r_y3": 433.5, "coord_origin": "TOPLEFT" }, "text": "0.931", "orig": "0.931", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 75, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 396.2, "r_y0": 441.7, "r_x1": 417.2, "r_y1": 441.7, "r_x2": 417.2, "r_y2": 433.6, "r_x3": 396.2, "r_y3": 433.6, "coord_origin": "TOPLEFT" }, "text": "0.834", "orig": "0.834", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 76, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 440.8, "r_y0": 441.7, "r_x1": 457.1, "r_y1": 441.7, "r_x2": 457.1, "r_y2": 433.6, "r_x3": 440.8, "r_y3": 433.6, "coord_origin": "TOPLEFT" }, "text": "3.81", "orig": "3.81", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 77, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 161.9, "r_y0": 460.5, "r_x1": 166.5, "r_y1": 460.5, "r_x2": 166.5, "r_y2": 452.4, "r_x3": 161.9, "r_y3": 452.4, "coord_origin": "TOPLEFT" }, "text": "4", "orig": "4", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 78, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 209.5, "r_y0": 460.5, "r_x1": 214.1, "r_y1": 460.5, "r_x2": 214.1, "r_y2": 452.4, "r_x3": 209.5, "r_y3": 452.4, "coord_origin": "TOPLEFT" }, "text": "2", "orig": "2", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 79, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 246.7, "r_y0": 455.0, "r_x1": 271.4, "r_y1": 455.0, "r_x2": 271.4, "r_y2": 446.9, "r_x3": 246.7, "r_y3": 446.9, "coord_origin": "TOPLEFT" }, "text": "OTSL", "orig": "OTSL", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 80, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 289.0, "r_y0": 455.0, "r_x1": 310.0, "r_y1": 455.0, "r_x2": 310.0, "r_y2": 446.9, "r_x3": 289.0, "r_y3": 446.9, "coord_origin": "TOPLEFT" }, "text": "0.952", "orig": "0.952", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 81, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 329.0, "r_y0": 455.0, "r_x1": 345.4, "r_y1": 455.0, "r_x2": 345.4, "r_y2": 446.9, "r_x3": 329.0, "r_y3": 446.9, "coord_origin": "TOPLEFT" }, "text": "0.92", "orig": "0.92", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 82, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 362.1, "r_y0": 454.8, "r_x1": 386.2, "r_y1": 454.8, "r_x2": 386.2, "r_y2": 446.9, "r_x3": 362.1, "r_y3": 446.9, "coord_origin": "TOPLEFT" }, "text": "0.942", "orig": "0.942", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 83, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 394.6, "r_y0": 454.8, "r_x1": 418.8, "r_y1": 454.8, "r_x2": 418.8, "r_y2": 446.9, "r_x3": 394.6, "r_y3": 446.9, "coord_origin": "TOPLEFT" }, "text": "0.857", "orig": "0.857", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 84, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 439.5, "r_y0": 454.8, "r_x1": 458.4, "r_y1": 454.8, "r_x2": 458.4, "r_y2": 446.9, "r_x3": 439.5, "r_y3": 446.9, "coord_origin": "TOPLEFT" }, "text": "1.22", "orig": "1.22", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 85, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 245.2, "r_y0": 468.0, "r_x1": 272.9, "r_y1": 468.0, "r_x2": 272.9, "r_y2": 459.9, "r_x3": 245.2, "r_y3": 459.9, "coord_origin": "TOPLEFT" }, "text": "HTML", "orig": "HTML", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 86, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 289.0, "r_y0": 468.0, "r_x1": 310.0, "r_y1": 468.0, "r_x2": 310.0, "r_y2": 459.9, "r_x3": 289.0, "r_y3": 459.9, "coord_origin": "TOPLEFT" }, "text": "0.944", "orig": "0.944", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 87, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 326.7, "r_y0": 468.0, "r_x1": 347.7, "r_y1": 468.0, "r_x2": 347.7, "r_y2": 459.9, "r_x3": 326.7, "r_y3": 459.9, "coord_origin": "TOPLEFT" }, "text": "0.903", "orig": "0.903", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 88, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 363.7, "r_y0": 468.0, "r_x1": 384.7, "r_y1": 468.0, "r_x2": 384.7, "r_y2": 459.9, "r_x3": 363.7, "r_y3": 459.9, "coord_origin": "TOPLEFT" }, "text": "0.931", "orig": "0.931", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 89, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 396.2, "r_y0": 468.0, "r_x1": 417.2, "r_y1": 468.0, "r_x2": 417.2, "r_y2": 459.9, "r_x3": 396.2, "r_y3": 459.9, "coord_origin": "TOPLEFT" }, "text": "0.824", "orig": "0.824", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 90, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 446.7, "r_y0": 468.0, "r_x1": 451.3, "r_y1": 468.0, "r_x2": 451.3, "r_y2": 459.9, "r_x3": 446.7, "r_y3": 459.9, "coord_origin": "TOPLEFT" }, "text": "2", "orig": "2", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 91, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 134.8, "r_y0": 517.0, "r_x1": 149.4, "r_y1": 517.0, "r_x2": 149.4, "r_y2": 508.2, "r_x3": 134.8, "r_y3": 508.2, "coord_origin": "TOPLEFT" }, "text": "5.2", "orig": "5.2", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 92, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 160.9, "r_y0": 517.0, "r_x1": 264.4, "r_y1": 517.0, "r_x2": 264.4, "r_y2": 508.2, "r_x3": 160.9, "r_y3": 508.2, "coord_origin": "TOPLEFT" }, "text": "Quantitative Results", "orig": "Quantitative Results", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 93, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 134.8, "r_y0": 533.3, "r_x1": 480.6, "r_y1": 533.3, "r_x2": 480.6, "r_y2": 524.6, "r_x3": 134.8, "r_y3": 524.6, "coord_origin": "TOPLEFT" }, "text": "We picked the model parameter configuration that produced the best prediction", "orig": "We picked the model parameter configuration that produced the best prediction", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 94, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 134.8, "r_y0": 545.3, "r_x1": 480.6, "r_y1": 545.3, "r_x2": 480.6, "r_y2": 536.5, "r_x3": 134.8, "r_y3": 536.5, "coord_origin": "TOPLEFT" }, "text": "quality (enc=6, dec=6, heads=8) with PubTabNet alone, then independently", "orig": "quality (enc=6, dec=6, heads=8) with PubTabNet alone, then independently", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 95, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 134.8, "r_y0": 557.3, "r_x1": 480.6, "r_y1": 557.3, "r_x2": 480.6, "r_y2": 548.5, "r_x3": 134.8, "r_y3": 548.5, "coord_origin": "TOPLEFT" }, "text": "trained and evaluated it on three publicly available data sets: PubTabNet (395k", "orig": "trained and evaluated it on three publicly available data sets: PubTabNet (395k", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 96, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 134.8, "r_y0": 569.2, "r_x1": 480.6, "r_y1": 569.2, "r_x2": 480.6, "r_y2": 560.4, "r_x3": 134.8, "r_y3": 560.4, "coord_origin": "TOPLEFT" }, "text": "samples), FinTabNet (113k samples) and PubTables-1M (about 1M samples).", "orig": "samples), FinTabNet (113k samples) and PubTables-1M (about 1M samples).", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 97, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 134.8, "r_y0": 581.2, "r_x1": 480.6, "r_y1": 581.2, "r_x2": 480.6, "r_y2": 572.4, "r_x3": 134.8, "r_y3": 572.4, "coord_origin": "TOPLEFT" }, "text": "Performance results are presented in Table. 2. It is clearly evident that the model", "orig": "Performance results are presented in Table. 2. It is clearly evident that the model", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 98, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 134.8, "r_y0": 593.1, "r_x1": 480.6, "r_y1": 593.1, "r_x2": 480.6, "r_y2": 584.3, "r_x3": 134.8, "r_y3": 584.3, "coord_origin": "TOPLEFT" }, "text": "trained on OTSL outperforms HTML across the board, keeping high TEDs and", "orig": "trained on OTSL outperforms HTML across the board, keeping high TEDs and", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 99, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 134.8, "r_y0": 605.1, "r_x1": 480.6, "r_y1": 605.1, "r_x2": 480.6, "r_y2": 596.3, "r_x3": 134.8, "r_y3": 596.3, "coord_origin": "TOPLEFT" }, "text": "mAP scores even on difficult financial tables (FinTabNet) that contain sparse", "orig": "mAP scores even on difficult financial tables (FinTabNet) that contain sparse", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 100, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 134.8, "r_y0": 617.0, "r_x1": 206.8, "r_y1": 617.0, "r_x2": 206.8, "r_y2": 608.2, "r_x3": 134.8, "r_y3": 608.2, "coord_origin": "TOPLEFT" }, "text": "and large tables.", "orig": "and large tables.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 101, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 149.7, "r_y0": 629.0, "r_x1": 480.6, "r_y1": 629.0, "r_x2": 480.6, "r_y2": 620.2, "r_x3": 149.7, "r_y3": 620.2, "coord_origin": "TOPLEFT" }, "text": "Additionally, the results show that OTSL has an advantage over HTML", "orig": "Additionally, the results show that OTSL has an advantage over HTML", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 102, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 134.8, "r_y0": 640.9, "r_x1": 480.6, "r_y1": 640.9, "r_x2": 480.6, "r_y2": 632.1, "r_x3": 134.8, "r_y3": 632.1, "coord_origin": "TOPLEFT" }, "text": "when applied on a bigger data set like PubTables-1M and achieves significantly", "orig": "when applied on a bigger data set like PubTables-1M and achieves significantly", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 103, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 134.8, "r_y0": 652.9, "r_x1": 480.6, "r_y1": 652.9, "r_x2": 480.6, "r_y2": 644.1, "r_x3": 134.8, "r_y3": 644.1, "coord_origin": "TOPLEFT" }, "text": "improved scores. Finally, OTSL achieves faster inference due to fewer decoding", "orig": "improved scores. Finally, OTSL achieves faster inference due to fewer decoding", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 104, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 134.8, "r_y0": 664.9, "r_x1": 405.8, "r_y1": 664.9, "r_x2": 405.8, "r_y2": 656.1, "r_x3": 134.8, "r_y3": 656.1, "coord_origin": "TOPLEFT" }, "text": "steps which is a result of the reduced sequence representation.", "orig": "steps which is a result of the reduced sequence representation.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "has_chars": false, "has_words": false, "has_lines": true, "image": null, "lines": [] }, "predictions": { "layout": { "clusters": [ { "id": 8, "label": "page_header", "bbox": { "l": 194.5, "t": 93.8, "r": 447.5, "b": 101.8, "coord_origin": "TOPLEFT" }, "confidence": 0.94, "cells": [ { "index": 0, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 194.5, "r_y0": 101.8, "r_x1": 447.5, "r_y1": 101.8, "r_x2": 447.5, "r_y2": 93.8, "r_x3": 194.5, "r_y3": 93.8, "coord_origin": "TOPLEFT" }, "text": "Optimized Table Tokenization for Table Structure Recognition", "orig": "Optimized Table Tokenization for Table Structure Recognition", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 9, "label": "page_header", "bbox": { "l": 476.0, "t": 93.8, "r": 480.6, "b": 101.8, "coord_origin": "TOPLEFT" }, "confidence": 0.89, "cells": [ { "index": 1, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 476.0, "r_y0": 101.8, "r_x1": 480.6, "r_y1": 101.8, "r_x2": 480.6, "r_y2": 93.8, "r_x3": 476.0, "r_y3": 93.8, "coord_origin": "TOPLEFT" }, "text": "9", "orig": "9", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 4, "label": "text", "bbox": { "l": 134.8, "t": 118.9, "r": 480.6, "b": 151.6, "coord_origin": "TOPLEFT" }, "confidence": 0.98, "cells": [ { "index": 2, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 134.8, "r_y0": 127.7, "r_x1": 480.6, "r_y1": 127.7, "r_x2": 480.6, "r_y2": 118.9, "r_x3": 134.8, "r_y3": 118.9, "coord_origin": "TOPLEFT" }, "text": "order to compute the TED score. Inference timing results for all experiments", "orig": "order to compute the TED score. Inference timing results for all experiments", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 3, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 134.8, "r_y0": 139.7, "r_x1": 480.6, "r_y1": 139.7, "r_x2": 480.6, "r_y2": 130.9, "r_x3": 134.8, "r_y3": 130.9, "coord_origin": "TOPLEFT" }, "text": "were obtained from the same machine on a single core with AMD EPYC 7763", "orig": "were obtained from the same machine on a single core with AMD EPYC 7763", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 4, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 134.8, "r_y0": 151.6, "r_x1": 210.8, "r_y1": 151.6, "r_x2": 210.8, "r_y2": 142.8, "r_x3": 134.8, "r_y3": 142.8, "coord_origin": "TOPLEFT" }, "text": "CPU @2.45 GHz.", "orig": "CPU @2.45 GHz.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 6, "label": "section_header", "bbox": { "l": 134.8, "t": 169.2, "r": 318.4, "b": 178.0, "coord_origin": "TOPLEFT" }, "confidence": 0.96, "cells": [ { "index": 5, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 134.8, "r_y0": 178.0, "r_x1": 149.4, "r_y1": 178.0, "r_x2": 149.4, "r_y2": 169.2, "r_x3": 134.8, "r_y3": 169.2, "coord_origin": "TOPLEFT" }, "text": "5.1", "orig": "5.1", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 6, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 160.9, "r_y0": 178.0, "r_x1": 318.4, "r_y1": 178.0, "r_x2": 318.4, "r_y2": 169.2, "r_x3": 160.9, "r_y3": 169.2, "coord_origin": "TOPLEFT" }, "text": "Hyper Parameter Optimization", "orig": "Hyper Parameter Optimization", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 3, "label": "text", "bbox": { "l": 134.8, "t": 185.6, "r": 480.6, "b": 254.2, "coord_origin": "TOPLEFT" }, "confidence": 0.98, "cells": [ { "index": 7, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 134.8, "r_y0": 194.4, "r_x1": 480.6, "r_y1": 194.4, "r_x2": 480.6, "r_y2": 185.6, "r_x3": 134.8, "r_y3": 185.6, "coord_origin": "TOPLEFT" }, "text": "We have chosen the PubTabNet data set to perform HPO, since it includes a", "orig": "We have chosen the PubTabNet data set to perform HPO, since it includes a", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 8, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 134.8, "r_y0": 206.3, "r_x1": 480.6, "r_y1": 206.3, "r_x2": 480.6, "r_y2": 197.5, "r_x3": 134.8, "r_y3": 197.5, "coord_origin": "TOPLEFT" }, "text": "highly diverse set of tables. Also we report TED scores separately for simple and", "orig": "highly diverse set of tables. Also we report TED scores separately for simple and", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 9, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 134.8, "r_y0": 218.3, "r_x1": 480.6, "r_y1": 218.3, "r_x2": 480.6, "r_y2": 209.5, "r_x3": 134.8, "r_y3": 209.5, "coord_origin": "TOPLEFT" }, "text": "complex tables (tables with cell spans). Results are presented in Table. 1. It is", "orig": "complex tables (tables with cell spans). Results are presented in Table. 1. It is", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 10, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 134.8, "r_y0": 230.2, "r_x1": 480.6, "r_y1": 230.2, "r_x2": 480.6, "r_y2": 221.5, "r_x3": 134.8, "r_y3": 221.5, "coord_origin": "TOPLEFT" }, "text": "evident that with OTSL, our model achieves the same TED score and slightly", "orig": "evident that with OTSL, our model achieves the same TED score and slightly", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 11, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 134.8, "r_y0": 242.2, "r_x1": 440.9, "r_y1": 242.2, "r_x2": 440.9, "r_y2": 233.4, "r_x3": 134.8, "r_y3": 233.4, "coord_origin": "TOPLEFT" }, "text": "better mAP scores in comparison to HTML. However OTSL yields a", "orig": "better mAP scores in comparison to HTML. However OTSL yields a", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 12, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 444.9, "r_y0": 242.2, "r_x1": 480.6, "r_y1": 242.2, "r_x2": 480.6, "r_y2": 233.4, "r_x3": 444.9, "r_y3": 233.4, "coord_origin": "TOPLEFT" }, "text": "2x speed", "orig": "2x speed", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 13, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 134.8, "r_y0": 254.2, "r_x1": 145.2, "r_y1": 254.2, "r_x2": 145.2, "r_y2": 245.4, "r_x3": 134.8, "r_y3": 245.4, "coord_origin": "TOPLEFT" }, "text": "up", "orig": "up", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 14, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 149.1, "r_y0": 254.2, "r_x1": 311.2, "r_y1": 254.2, "r_x2": 311.2, "r_y2": 245.4, "r_x3": 149.1, "r_y3": 245.4, "coord_origin": "TOPLEFT" }, "text": "in the inference runtime over HTML.", "orig": "in the inference runtime over HTML.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 7, "label": "caption", "bbox": { "l": 134.8, "t": 275.1, "r": 480.6, "b": 327.0, "coord_origin": "TOPLEFT" }, "confidence": 0.96, "cells": [ { "index": 15, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 134.8, "r_y0": 283.0, "r_x1": 160.1, "r_y1": 283.0, "r_x2": 160.1, "r_y2": 275.1, "r_x3": 134.8, "r_y3": 275.1, "coord_origin": "TOPLEFT" }, "text": "Table", "orig": "Table", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 16, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 167.3, "r_y0": 283.0, "r_x1": 175.6, "r_y1": 283.0, "r_x2": 175.6, "r_y2": 275.1, "r_x3": 167.3, "r_y3": 275.1, "coord_origin": "TOPLEFT" }, "text": "1.", "orig": "1.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 17, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 188.1, "r_y0": 283.2, "r_x1": 480.6, "r_y1": 283.2, "r_x2": 480.6, "r_y2": 275.1, "r_x3": 188.1, "r_y3": 275.1, "coord_origin": "TOPLEFT" }, "text": "HPO performed in OTSL and HTML representation on the same", "orig": "HPO performed in OTSL and HTML representation on the same", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 18, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 134.8, "r_y0": 294.2, "r_x1": 480.6, "r_y1": 294.2, "r_x2": 480.6, "r_y2": 286.1, "r_x3": 134.8, "r_y3": 286.1, "coord_origin": "TOPLEFT" }, "text": "transformer-based TableFormer [9] architecture, trained only on PubTabNet [22]. Ef-", "orig": "transformer-based TableFormer [9] architecture, trained only on PubTabNet [22]. Ef-", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 19, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 134.8, "r_y0": 305.1, "r_x1": 480.6, "r_y1": 305.1, "r_x2": 480.6, "r_y2": 297.1, "r_x3": 134.8, "r_y3": 297.1, "coord_origin": "TOPLEFT" }, "text": "fects of reducing the # of layers in encoder and decoder stages of the model show that", "orig": "fects of reducing the # of layers in encoder and decoder stages of the model show that", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 20, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 134.8, "r_y0": 316.1, "r_x1": 480.6, "r_y1": 316.1, "r_x2": 480.6, "r_y2": 308.0, "r_x3": 134.8, "r_y3": 308.0, "coord_origin": "TOPLEFT" }, "text": "smaller models trained on OTSL perform better, especially in recognizing complex", "orig": "smaller models trained on OTSL perform better, especially in recognizing complex", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 21, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 134.8, "r_y0": 327.0, "r_x1": 480.6, "r_y1": 327.0, "r_x2": 480.6, "r_y2": 319.0, "r_x3": 134.8, "r_y3": 319.0, "coord_origin": "TOPLEFT" }, "text": "table structures, and maintain a much higher mAP score than the HTML counterpart.", "orig": "table structures, and maintain a much higher mAP score than the HTML counterpart.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 0, "label": "table", "bbox": { "l": 139.7, "t": 337.6, "r": 475.0, "b": 469.5, "coord_origin": "TOPLEFT" }, "confidence": 0.99, "cells": [ { "index": 22, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 160.4, "r_y0": 349.8, "r_x1": 168.0, "r_y1": 349.8, "r_x2": 168.0, "r_y2": 341.7, "r_x3": 160.4, "r_y3": 341.7, "coord_origin": "TOPLEFT" }, "text": "#", "orig": "#", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 23, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 144.6, "r_y0": 362.8, "r_x1": 183.8, "r_y1": 362.8, "r_x2": 183.8, "r_y2": 354.7, "r_x3": 144.6, "r_y3": 354.7, "coord_origin": "TOPLEFT" }, "text": "enc-layers", "orig": "enc-layers", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 24, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 208.0, "r_y0": 349.8, "r_x1": 215.7, "r_y1": 349.8, "r_x2": 215.7, "r_y2": 341.7, "r_x3": 208.0, "r_y3": 341.7, "coord_origin": "TOPLEFT" }, "text": "#", "orig": "#", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 25, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 192.2, "r_y0": 362.8, "r_x1": 231.4, "r_y1": 362.8, "r_x2": 231.4, "r_y2": 354.7, "r_x3": 192.2, "r_y3": 354.7, "coord_origin": "TOPLEFT" }, "text": "dec-layers", "orig": "dec-layers", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 26, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 239.8, "r_y0": 355.3, "r_x1": 278.3, "r_y1": 355.3, "r_x2": 278.3, "r_y2": 347.2, "r_x3": 239.8, "r_y3": 347.2, "coord_origin": "TOPLEFT" }, "text": "Language", "orig": "Language", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 27, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 324.7, "r_y0": 349.8, "r_x1": 348.3, "r_y1": 349.8, "r_x2": 348.3, "r_y2": 341.7, "r_x3": 324.7, "r_y3": 341.7, "coord_origin": "TOPLEFT" }, "text": "TEDs", "orig": "TEDs", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 28, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 396.3, "r_y0": 349.8, "r_x1": 417.1, "r_y1": 349.8, "r_x2": 417.1, "r_y2": 341.7, "r_x3": 396.3, "r_y3": 341.7, "coord_origin": "TOPLEFT" }, "text": "mAP", "orig": "mAP", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 29, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 394.9, "r_y0": 360.8, "r_x1": 418.5, "r_y1": 360.8, "r_x2": 418.5, "r_y2": 352.7, "r_x3": 394.9, "r_y3": 352.7, "coord_origin": "TOPLEFT" }, "text": "(0.75)", "orig": "(0.75)", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 30, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 430.8, "r_y0": 349.8, "r_x1": 467.1, "r_y1": 349.8, "r_x2": 467.1, "r_y2": 341.7, "r_x3": 430.8, "r_y3": 341.7, "coord_origin": "TOPLEFT" }, "text": "Inference", "orig": "Inference", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 31, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 427.1, "r_y0": 360.8, "r_x1": 470.8, "r_y1": 360.8, "r_x2": 470.8, "r_y2": 352.7, "r_x3": 427.1, "r_y3": 352.7, "coord_origin": "TOPLEFT" }, "text": "time (secs)", "orig": "time (secs)", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 32, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 286.7, "r_y0": 362.8, "r_x1": 312.3, "r_y1": 362.8, "r_x2": 312.3, "r_y2": 354.7, "r_x3": 286.7, "r_y3": 354.7, "coord_origin": "TOPLEFT" }, "text": "simple", "orig": "simple", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 33, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 320.7, "r_y0": 362.8, "r_x1": 353.7, "r_y1": 362.8, "r_x2": 353.7, "r_y2": 354.7, "r_x3": 320.7, "r_y3": 354.7, "coord_origin": "TOPLEFT" }, "text": "complex", "orig": "complex", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 34, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 369.3, "r_y0": 362.8, "r_x1": 379.0, "r_y1": 362.8, "r_x2": 379.0, "r_y2": 354.7, "r_x3": 369.3, "r_y3": 354.7, "coord_origin": "TOPLEFT" }, "text": "all", "orig": "all", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 35, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 161.9, "r_y0": 381.6, "r_x1": 166.5, "r_y1": 381.6, "r_x2": 166.5, "r_y2": 373.5, "r_x3": 161.9, "r_y3": 373.5, "coord_origin": "TOPLEFT" }, "text": "6", "orig": "6", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 36, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 209.5, "r_y0": 381.6, "r_x1": 214.1, "r_y1": 381.6, "r_x2": 214.1, "r_y2": 373.5, "r_x3": 209.5, "r_y3": 373.5, "coord_origin": "TOPLEFT" }, "text": "6", "orig": "6", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 37, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 246.7, "r_y0": 376.1, "r_x1": 271.4, "r_y1": 376.1, "r_x2": 271.4, "r_y2": 368.0, "r_x3": 246.7, "r_y3": 368.0, "coord_origin": "TOPLEFT" }, "text": "OTSL", "orig": "OTSL", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 38, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 289.0, "r_y0": 376.1, "r_x1": 310.0, "r_y1": 376.1, "r_x2": 310.0, "r_y2": 368.0, "r_x3": 289.0, "r_y3": 368.0, "coord_origin": "TOPLEFT" }, "text": "0.965", "orig": "0.965", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 39, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 326.7, "r_y0": 376.1, "r_x1": 347.7, "r_y1": 376.1, "r_x2": 347.7, "r_y2": 368.0, "r_x3": 326.7, "r_y3": 368.0, "coord_origin": "TOPLEFT" }, "text": "0.934", "orig": "0.934", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 40, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 363.7, "r_y0": 376.1, "r_x1": 384.7, "r_y1": 376.1, "r_x2": 384.7, "r_y2": 368.0, "r_x3": 363.7, "r_y3": 368.0, "coord_origin": "TOPLEFT" }, "text": "0.955", "orig": "0.955", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 41, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 397.3, "r_y0": 375.9, "r_x1": 416.1, "r_y1": 375.9, "r_x2": 416.1, "r_y2": 368.0, "r_x3": 397.3, "r_y3": 368.0, "coord_origin": "TOPLEFT" }, "text": "0.88", "orig": "0.88", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 42, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 439.5, "r_y0": 375.9, "r_x1": 458.4, "r_y1": 375.9, "r_x2": 458.4, "r_y2": 368.0, "r_x3": 439.5, "r_y3": 368.0, "coord_origin": "TOPLEFT" }, "text": "2.73", "orig": "2.73", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 43, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 245.2, "r_y0": 389.1, "r_x1": 272.9, "r_y1": 389.1, "r_x2": 272.9, "r_y2": 381.0, "r_x3": 245.2, "r_y3": 381.0, "coord_origin": "TOPLEFT" }, "text": "HTML", "orig": "HTML", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 44, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 289.0, "r_y0": 389.1, "r_x1": 310.0, "r_y1": 389.1, "r_x2": 310.0, "r_y2": 381.0, "r_x3": 289.0, "r_y3": 381.0, "coord_origin": "TOPLEFT" }, "text": "0.969", "orig": "0.969", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 45, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 326.7, "r_y0": 389.1, "r_x1": 347.7, "r_y1": 389.1, "r_x2": 347.7, "r_y2": 381.0, "r_x3": 326.7, "r_y3": 381.0, "coord_origin": "TOPLEFT" }, "text": "0.927", "orig": "0.927", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 46, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 363.7, "r_y0": 389.1, "r_x1": 384.7, "r_y1": 389.1, "r_x2": 384.7, "r_y2": 381.0, "r_x3": 363.7, "r_y3": 381.0, "coord_origin": "TOPLEFT" }, "text": "0.955", "orig": "0.955", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 47, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 396.2, "r_y0": 389.1, "r_x1": 417.2, "r_y1": 389.1, "r_x2": 417.2, "r_y2": 381.0, "r_x3": 396.2, "r_y3": 381.0, "coord_origin": "TOPLEFT" }, "text": "0.857", "orig": "0.857", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 48, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 440.8, "r_y0": 389.1, "r_x1": 457.1, "r_y1": 389.1, "r_x2": 457.1, "r_y2": 381.0, "r_x3": 440.8, "r_y3": 381.0, "coord_origin": "TOPLEFT" }, "text": "5.39", "orig": "5.39", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 49, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 161.9, "r_y0": 407.9, "r_x1": 166.5, "r_y1": 407.9, "r_x2": 166.5, "r_y2": 399.8, "r_x3": 161.9, "r_y3": 399.8, "coord_origin": "TOPLEFT" }, "text": "4", "orig": "4", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 50, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 209.5, "r_y0": 407.9, "r_x1": 214.1, "r_y1": 407.9, "r_x2": 214.1, "r_y2": 399.8, "r_x3": 209.5, "r_y3": 399.8, "coord_origin": "TOPLEFT" }, "text": "4", "orig": "4", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 51, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 246.7, "r_y0": 402.4, "r_x1": 271.4, "r_y1": 402.4, "r_x2": 271.4, "r_y2": 394.3, "r_x3": 246.7, "r_y3": 394.3, "coord_origin": "TOPLEFT" }, "text": "OTSL", "orig": "OTSL", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 52, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 289.0, "r_y0": 402.4, "r_x1": 310.0, "r_y1": 402.4, "r_x2": 310.0, "r_y2": 394.3, "r_x3": 289.0, "r_y3": 394.3, "coord_origin": "TOPLEFT" }, "text": "0.938", "orig": "0.938", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 53, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 326.7, "r_y0": 402.4, "r_x1": 347.7, "r_y1": 402.4, "r_x2": 347.7, "r_y2": 394.3, "r_x3": 326.7, "r_y3": 394.3, "coord_origin": "TOPLEFT" }, "text": "0.904", "orig": "0.904", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 54, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 363.7, "r_y0": 402.4, "r_x1": 384.7, "r_y1": 402.4, "r_x2": 384.7, "r_y2": 394.3, "r_x3": 363.7, "r_y3": 394.3, "coord_origin": "TOPLEFT" }, "text": "0.927", "orig": "0.927", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 55, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 394.6, "r_y0": 402.2, "r_x1": 418.8, "r_y1": 402.2, "r_x2": 418.8, "r_y2": 394.3, "r_x3": 394.6, "r_y3": 394.3, "coord_origin": "TOPLEFT" }, "text": "0.853", "orig": "0.853", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 56, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 439.5, "r_y0": 402.2, "r_x1": 458.4, "r_y1": 402.2, "r_x2": 458.4, "r_y2": 394.3, "r_x3": 439.5, "r_y3": 394.3, "coord_origin": "TOPLEFT" }, "text": "1.97", "orig": "1.97", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 57, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 245.2, "r_y0": 415.4, "r_x1": 272.9, "r_y1": 415.4, "r_x2": 272.9, "r_y2": 407.3, "r_x3": 245.2, "r_y3": 407.3, "coord_origin": "TOPLEFT" }, "text": "HTML", "orig": "HTML", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 58, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 289.0, "r_y0": 415.4, "r_x1": 310.0, "r_y1": 415.4, "r_x2": 310.0, "r_y2": 407.3, "r_x3": 289.0, "r_y3": 407.3, "coord_origin": "TOPLEFT" }, "text": "0.952", "orig": "0.952", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 59, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 326.7, "r_y0": 415.4, "r_x1": 347.7, "r_y1": 415.4, "r_x2": 347.7, "r_y2": 407.3, "r_x3": 326.7, "r_y3": 407.3, "coord_origin": "TOPLEFT" }, "text": "0.909", "orig": "0.909", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 60, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 362.1, "r_y0": 415.2, "r_x1": 386.2, "r_y1": 415.2, "r_x2": 386.2, "r_y2": 407.2, "r_x3": 362.1, "r_y3": 407.2, "coord_origin": "TOPLEFT" }, "text": "0.938", "orig": "0.938", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 61, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 396.2, "r_y0": 415.4, "r_x1": 417.2, "r_y1": 415.4, "r_x2": 417.2, "r_y2": 407.3, "r_x3": 396.2, "r_y3": 407.3, "coord_origin": "TOPLEFT" }, "text": "0.843", "orig": "0.843", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 62, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 440.8, "r_y0": 415.4, "r_x1": 457.1, "r_y1": 415.4, "r_x2": 457.1, "r_y2": 407.3, "r_x3": 440.8, "r_y3": 407.3, "coord_origin": "TOPLEFT" }, "text": "3.77", "orig": "3.77", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 63, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 161.9, "r_y0": 434.2, "r_x1": 166.5, "r_y1": 434.2, "r_x2": 166.5, "r_y2": 426.1, "r_x3": 161.9, "r_y3": 426.1, "coord_origin": "TOPLEFT" }, "text": "2", "orig": "2", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 64, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 209.5, "r_y0": 434.2, "r_x1": 214.1, "r_y1": 434.2, "r_x2": 214.1, "r_y2": 426.1, "r_x3": 209.5, "r_y3": 426.1, "coord_origin": "TOPLEFT" }, "text": "4", "orig": "4", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 65, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 246.7, "r_y0": 428.7, "r_x1": 271.4, "r_y1": 428.7, "r_x2": 271.4, "r_y2": 420.6, "r_x3": 246.7, "r_y3": 420.6, "coord_origin": "TOPLEFT" }, "text": "OTSL", "orig": "OTSL", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 66, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 289.0, "r_y0": 428.7, "r_x1": 310.0, "r_y1": 428.7, "r_x2": 310.0, "r_y2": 420.6, "r_x3": 289.0, "r_y3": 420.6, "coord_origin": "TOPLEFT" }, "text": "0.923", "orig": "0.923", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 67, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 326.7, "r_y0": 428.7, "r_x1": 347.7, "r_y1": 428.7, "r_x2": 347.7, "r_y2": 420.6, "r_x3": 326.7, "r_y3": 420.6, "coord_origin": "TOPLEFT" }, "text": "0.897", "orig": "0.897", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 68, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 363.7, "r_y0": 428.7, "r_x1": 384.7, "r_y1": 428.7, "r_x2": 384.7, "r_y2": 420.6, "r_x3": 363.7, "r_y3": 420.6, "coord_origin": "TOPLEFT" }, "text": "0.915", "orig": "0.915", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 69, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 394.6, "r_y0": 428.5, "r_x1": 418.8, "r_y1": 428.5, "r_x2": 418.8, "r_y2": 420.6, "r_x3": 394.6, "r_y3": 420.6, "coord_origin": "TOPLEFT" }, "text": "0.859", "orig": "0.859", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 70, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 439.5, "r_y0": 428.5, "r_x1": 458.4, "r_y1": 428.5, "r_x2": 458.4, "r_y2": 420.6, "r_x3": 439.5, "r_y3": 420.6, "coord_origin": "TOPLEFT" }, "text": "1.91", "orig": "1.91", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 71, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 245.2, "r_y0": 441.7, "r_x1": 272.9, "r_y1": 441.7, "r_x2": 272.9, "r_y2": 433.6, "r_x3": 245.2, "r_y3": 433.6, "coord_origin": "TOPLEFT" }, "text": "HTML", "orig": "HTML", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 72, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 289.0, "r_y0": 441.7, "r_x1": 310.0, "r_y1": 441.7, "r_x2": 310.0, "r_y2": 433.6, "r_x3": 289.0, "r_y3": 433.6, "coord_origin": "TOPLEFT" }, "text": "0.945", "orig": "0.945", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 73, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 326.7, "r_y0": 441.7, "r_x1": 347.7, "r_y1": 441.7, "r_x2": 347.7, "r_y2": 433.6, "r_x3": 326.7, "r_y3": 433.6, "coord_origin": "TOPLEFT" }, "text": "0.901", "orig": "0.901", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 74, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 362.1, "r_y0": 441.5, "r_x1": 386.2, "r_y1": 441.5, "r_x2": 386.2, "r_y2": 433.5, "r_x3": 362.1, "r_y3": 433.5, "coord_origin": "TOPLEFT" }, "text": "0.931", "orig": "0.931", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 75, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 396.2, "r_y0": 441.7, "r_x1": 417.2, "r_y1": 441.7, "r_x2": 417.2, "r_y2": 433.6, "r_x3": 396.2, "r_y3": 433.6, "coord_origin": "TOPLEFT" }, "text": "0.834", "orig": "0.834", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 76, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 440.8, "r_y0": 441.7, "r_x1": 457.1, "r_y1": 441.7, "r_x2": 457.1, "r_y2": 433.6, "r_x3": 440.8, "r_y3": 433.6, "coord_origin": "TOPLEFT" }, "text": "3.81", "orig": "3.81", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 77, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 161.9, "r_y0": 460.5, "r_x1": 166.5, "r_y1": 460.5, "r_x2": 166.5, "r_y2": 452.4, "r_x3": 161.9, "r_y3": 452.4, "coord_origin": "TOPLEFT" }, "text": "4", "orig": "4", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 78, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 209.5, "r_y0": 460.5, "r_x1": 214.1, "r_y1": 460.5, "r_x2": 214.1, "r_y2": 452.4, "r_x3": 209.5, "r_y3": 452.4, "coord_origin": "TOPLEFT" }, "text": "2", "orig": "2", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 79, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 246.7, "r_y0": 455.0, "r_x1": 271.4, "r_y1": 455.0, "r_x2": 271.4, "r_y2": 446.9, "r_x3": 246.7, "r_y3": 446.9, "coord_origin": "TOPLEFT" }, "text": "OTSL", "orig": "OTSL", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 80, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 289.0, "r_y0": 455.0, "r_x1": 310.0, "r_y1": 455.0, "r_x2": 310.0, "r_y2": 446.9, "r_x3": 289.0, "r_y3": 446.9, "coord_origin": "TOPLEFT" }, "text": "0.952", "orig": "0.952", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 81, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 329.0, "r_y0": 455.0, "r_x1": 345.4, "r_y1": 455.0, "r_x2": 345.4, "r_y2": 446.9, "r_x3": 329.0, "r_y3": 446.9, "coord_origin": "TOPLEFT" }, "text": "0.92", "orig": "0.92", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 82, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 362.1, "r_y0": 454.8, "r_x1": 386.2, "r_y1": 454.8, "r_x2": 386.2, "r_y2": 446.9, "r_x3": 362.1, "r_y3": 446.9, "coord_origin": "TOPLEFT" }, "text": "0.942", "orig": "0.942", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 83, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 394.6, "r_y0": 454.8, "r_x1": 418.8, "r_y1": 454.8, "r_x2": 418.8, "r_y2": 446.9, "r_x3": 394.6, "r_y3": 446.9, "coord_origin": "TOPLEFT" }, "text": "0.857", "orig": "0.857", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 84, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 439.5, "r_y0": 454.8, "r_x1": 458.4, "r_y1": 454.8, "r_x2": 458.4, "r_y2": 446.9, "r_x3": 439.5, "r_y3": 446.9, "coord_origin": "TOPLEFT" }, "text": "1.22", "orig": "1.22", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 85, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 245.2, "r_y0": 468.0, "r_x1": 272.9, "r_y1": 468.0, "r_x2": 272.9, "r_y2": 459.9, "r_x3": 245.2, "r_y3": 459.9, "coord_origin": "TOPLEFT" }, "text": "HTML", "orig": "HTML", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 86, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 289.0, "r_y0": 468.0, "r_x1": 310.0, "r_y1": 468.0, "r_x2": 310.0, "r_y2": 459.9, "r_x3": 289.0, "r_y3": 459.9, "coord_origin": "TOPLEFT" }, "text": "0.944", "orig": "0.944", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 87, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 326.7, "r_y0": 468.0, "r_x1": 347.7, "r_y1": 468.0, "r_x2": 347.7, "r_y2": 459.9, "r_x3": 326.7, "r_y3": 459.9, "coord_origin": "TOPLEFT" }, "text": "0.903", "orig": "0.903", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 88, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 363.7, "r_y0": 468.0, "r_x1": 384.7, "r_y1": 468.0, "r_x2": 384.7, "r_y2": 459.9, "r_x3": 363.7, "r_y3": 459.9, "coord_origin": "TOPLEFT" }, "text": "0.931", "orig": "0.931", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 89, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 396.2, "r_y0": 468.0, "r_x1": 417.2, "r_y1": 468.0, "r_x2": 417.2, "r_y2": 459.9, "r_x3": 396.2, "r_y3": 459.9, "coord_origin": "TOPLEFT" }, "text": "0.824", "orig": "0.824", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 90, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 446.7, "r_y0": 468.0, "r_x1": 451.3, "r_y1": 468.0, "r_x2": 451.3, "r_y2": 459.9, "r_x3": 446.7, "r_y3": 459.9, "coord_origin": "TOPLEFT" }, "text": "2", "orig": "2", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [ { "id": 11, "label": "text", "bbox": { "l": 160.4, "t": 341.7, "r": 168.0, "b": 349.8, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 22, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 160.4, "r_y0": 349.8, "r_x1": 168.0, "r_y1": 349.8, "r_x2": 168.0, "r_y2": 341.7, "r_x3": 160.4, "r_y3": 341.7, "coord_origin": "TOPLEFT" }, "text": "#", "orig": "#", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 12, "label": "text", "bbox": { "l": 144.6, "t": 354.7, "r": 183.8, "b": 362.8, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 23, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 144.6, "r_y0": 362.8, "r_x1": 183.8, "r_y1": 362.8, "r_x2": 183.8, "r_y2": 354.7, "r_x3": 144.6, "r_y3": 354.7, "coord_origin": "TOPLEFT" }, "text": "enc-layers", "orig": "enc-layers", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 13, "label": "text", "bbox": { "l": 208.0, "t": 341.7, "r": 215.7, "b": 349.8, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 24, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 208.0, "r_y0": 349.8, "r_x1": 215.7, "r_y1": 349.8, "r_x2": 215.7, "r_y2": 341.7, "r_x3": 208.0, "r_y3": 341.7, "coord_origin": "TOPLEFT" }, "text": "#", "orig": "#", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 14, "label": "text", "bbox": { "l": 192.2, "t": 354.7, "r": 231.4, "b": 362.8, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 25, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 192.2, "r_y0": 362.8, "r_x1": 231.4, "r_y1": 362.8, "r_x2": 231.4, "r_y2": 354.7, "r_x3": 192.2, "r_y3": 354.7, "coord_origin": "TOPLEFT" }, "text": "dec-layers", "orig": "dec-layers", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 15, "label": "text", "bbox": { "l": 239.8, "t": 347.2, "r": 278.3, "b": 355.3, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 26, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 239.8, "r_y0": 355.3, "r_x1": 278.3, "r_y1": 355.3, "r_x2": 278.3, "r_y2": 347.2, "r_x3": 239.8, "r_y3": 347.2, "coord_origin": "TOPLEFT" }, "text": "Language", "orig": "Language", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 16, "label": "text", "bbox": { "l": 324.7, "t": 341.7, "r": 348.3, "b": 349.8, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 27, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 324.7, "r_y0": 349.8, "r_x1": 348.3, "r_y1": 349.8, "r_x2": 348.3, "r_y2": 341.7, "r_x3": 324.7, "r_y3": 341.7, "coord_origin": "TOPLEFT" }, "text": "TEDs", "orig": "TEDs", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 17, "label": "text", "bbox": { "l": 396.3, "t": 341.7, "r": 417.1, "b": 349.8, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 28, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 396.3, "r_y0": 349.8, "r_x1": 417.1, "r_y1": 349.8, "r_x2": 417.1, "r_y2": 341.7, "r_x3": 396.3, "r_y3": 341.7, "coord_origin": "TOPLEFT" }, "text": "mAP", "orig": "mAP", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 18, "label": "text", "bbox": { "l": 394.9, "t": 352.7, "r": 418.5, "b": 360.8, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 29, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 394.9, "r_y0": 360.8, "r_x1": 418.5, "r_y1": 360.8, "r_x2": 418.5, "r_y2": 352.7, "r_x3": 394.9, "r_y3": 352.7, "coord_origin": "TOPLEFT" }, "text": "(0.75)", "orig": "(0.75)", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 19, "label": "text", "bbox": { "l": 430.8, "t": 341.7, "r": 467.1, "b": 349.8, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 30, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 430.8, "r_y0": 349.8, "r_x1": 467.1, "r_y1": 349.8, "r_x2": 467.1, "r_y2": 341.7, "r_x3": 430.8, "r_y3": 341.7, "coord_origin": "TOPLEFT" }, "text": "Inference", "orig": "Inference", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 20, "label": "text", "bbox": { "l": 427.1, "t": 352.7, "r": 470.8, "b": 360.8, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 31, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 427.1, "r_y0": 360.8, "r_x1": 470.8, "r_y1": 360.8, "r_x2": 470.8, "r_y2": 352.7, "r_x3": 427.1, "r_y3": 352.7, "coord_origin": "TOPLEFT" }, "text": "time (secs)", "orig": "time (secs)", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 21, "label": "text", "bbox": { "l": 286.7, "t": 354.7, "r": 312.3, "b": 362.8, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 32, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 286.7, "r_y0": 362.8, "r_x1": 312.3, "r_y1": 362.8, "r_x2": 312.3, "r_y2": 354.7, "r_x3": 286.7, "r_y3": 354.7, "coord_origin": "TOPLEFT" }, "text": "simple", "orig": "simple", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 22, "label": "text", "bbox": { "l": 320.7, "t": 354.7, "r": 353.7, "b": 362.8, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 33, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 320.7, "r_y0": 362.8, "r_x1": 353.7, "r_y1": 362.8, "r_x2": 353.7, "r_y2": 354.7, "r_x3": 320.7, "r_y3": 354.7, "coord_origin": "TOPLEFT" }, "text": "complex", "orig": "complex", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 23, "label": "text", "bbox": { "l": 369.3, "t": 354.7, "r": 379.0, "b": 362.8, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 34, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 369.3, "r_y0": 362.8, "r_x1": 379.0, "r_y1": 362.8, "r_x2": 379.0, "r_y2": 354.7, "r_x3": 369.3, "r_y3": 354.7, "coord_origin": "TOPLEFT" }, "text": "all", "orig": "all", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 24, "label": "text", "bbox": { "l": 161.9, "t": 373.5, "r": 166.5, "b": 381.6, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 35, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 161.9, "r_y0": 381.6, "r_x1": 166.5, "r_y1": 381.6, "r_x2": 166.5, "r_y2": 373.5, "r_x3": 161.9, "r_y3": 373.5, "coord_origin": "TOPLEFT" }, "text": "6", "orig": "6", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 25, "label": "text", "bbox": { "l": 209.5, "t": 373.5, "r": 214.1, "b": 381.6, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 36, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 209.5, "r_y0": 381.6, "r_x1": 214.1, "r_y1": 381.6, "r_x2": 214.1, "r_y2": 373.5, "r_x3": 209.5, "r_y3": 373.5, "coord_origin": "TOPLEFT" }, "text": "6", "orig": "6", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 26, "label": "text", "bbox": { "l": 246.7, "t": 368.0, "r": 271.4, "b": 376.1, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 37, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 246.7, "r_y0": 376.1, "r_x1": 271.4, "r_y1": 376.1, "r_x2": 271.4, "r_y2": 368.0, "r_x3": 246.7, "r_y3": 368.0, "coord_origin": "TOPLEFT" }, "text": "OTSL", "orig": "OTSL", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 27, "label": "text", "bbox": { "l": 289.0, "t": 368.0, "r": 310.0, "b": 376.1, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 38, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 289.0, "r_y0": 376.1, "r_x1": 310.0, "r_y1": 376.1, "r_x2": 310.0, "r_y2": 368.0, "r_x3": 289.0, "r_y3": 368.0, "coord_origin": "TOPLEFT" }, "text": "0.965", "orig": "0.965", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 28, "label": "text", "bbox": { "l": 326.7, "t": 368.0, "r": 347.7, "b": 376.1, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 39, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 326.7, "r_y0": 376.1, "r_x1": 347.7, "r_y1": 376.1, "r_x2": 347.7, "r_y2": 368.0, "r_x3": 326.7, "r_y3": 368.0, "coord_origin": "TOPLEFT" }, "text": "0.934", "orig": "0.934", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 29, "label": "text", "bbox": { "l": 363.7, "t": 368.0, "r": 384.7, "b": 376.1, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 40, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 363.7, "r_y0": 376.1, "r_x1": 384.7, "r_y1": 376.1, "r_x2": 384.7, "r_y2": 368.0, "r_x3": 363.7, "r_y3": 368.0, "coord_origin": "TOPLEFT" }, "text": "0.955", "orig": "0.955", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 30, "label": "text", "bbox": { "l": 397.3, "t": 368.0, "r": 416.1, "b": 375.9, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 41, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 397.3, "r_y0": 375.9, "r_x1": 416.1, "r_y1": 375.9, "r_x2": 416.1, "r_y2": 368.0, "r_x3": 397.3, "r_y3": 368.0, "coord_origin": "TOPLEFT" }, "text": "0.88", "orig": "0.88", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 31, "label": "text", "bbox": { "l": 439.5, "t": 368.0, "r": 458.4, "b": 375.9, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 42, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 439.5, "r_y0": 375.9, "r_x1": 458.4, "r_y1": 375.9, "r_x2": 458.4, "r_y2": 368.0, "r_x3": 439.5, "r_y3": 368.0, "coord_origin": "TOPLEFT" }, "text": "2.73", "orig": "2.73", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 32, "label": "text", "bbox": { "l": 245.2, "t": 381.0, "r": 272.9, "b": 389.1, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 43, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 245.2, "r_y0": 389.1, "r_x1": 272.9, "r_y1": 389.1, "r_x2": 272.9, "r_y2": 381.0, "r_x3": 245.2, "r_y3": 381.0, "coord_origin": "TOPLEFT" }, "text": "HTML", "orig": "HTML", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 33, "label": "text", "bbox": { "l": 289.0, "t": 381.0, "r": 310.0, "b": 389.1, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 44, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 289.0, "r_y0": 389.1, "r_x1": 310.0, "r_y1": 389.1, "r_x2": 310.0, "r_y2": 381.0, "r_x3": 289.0, "r_y3": 381.0, "coord_origin": "TOPLEFT" }, "text": "0.969", "orig": "0.969", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 34, "label": "text", "bbox": { "l": 326.7, "t": 381.0, "r": 347.7, "b": 389.1, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 45, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 326.7, "r_y0": 389.1, "r_x1": 347.7, "r_y1": 389.1, "r_x2": 347.7, "r_y2": 381.0, "r_x3": 326.7, "r_y3": 381.0, "coord_origin": "TOPLEFT" }, "text": "0.927", "orig": "0.927", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 35, "label": "text", "bbox": { "l": 363.7, "t": 381.0, "r": 384.7, "b": 389.1, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 46, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 363.7, "r_y0": 389.1, "r_x1": 384.7, "r_y1": 389.1, "r_x2": 384.7, "r_y2": 381.0, "r_x3": 363.7, "r_y3": 381.0, "coord_origin": "TOPLEFT" }, "text": "0.955", "orig": "0.955", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 36, "label": "text", "bbox": { "l": 396.2, "t": 381.0, "r": 417.2, "b": 389.1, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 47, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 396.2, "r_y0": 389.1, "r_x1": 417.2, "r_y1": 389.1, "r_x2": 417.2, "r_y2": 381.0, "r_x3": 396.2, "r_y3": 381.0, "coord_origin": "TOPLEFT" }, "text": "0.857", "orig": "0.857", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 37, "label": "text", "bbox": { "l": 440.8, "t": 381.0, "r": 457.1, "b": 389.1, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 48, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 440.8, "r_y0": 389.1, "r_x1": 457.1, "r_y1": 389.1, "r_x2": 457.1, "r_y2": 381.0, "r_x3": 440.8, "r_y3": 381.0, "coord_origin": "TOPLEFT" }, "text": "5.39", "orig": "5.39", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 38, "label": "text", "bbox": { "l": 161.9, "t": 399.8, "r": 166.5, "b": 407.9, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 49, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 161.9, "r_y0": 407.9, "r_x1": 166.5, "r_y1": 407.9, "r_x2": 166.5, "r_y2": 399.8, "r_x3": 161.9, "r_y3": 399.8, "coord_origin": "TOPLEFT" }, "text": "4", "orig": "4", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 39, "label": "text", "bbox": { "l": 209.5, "t": 399.8, "r": 214.1, "b": 407.9, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 50, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 209.5, "r_y0": 407.9, "r_x1": 214.1, "r_y1": 407.9, "r_x2": 214.1, "r_y2": 399.8, "r_x3": 209.5, "r_y3": 399.8, "coord_origin": "TOPLEFT" }, "text": "4", "orig": "4", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 40, "label": "text", "bbox": { "l": 246.7, "t": 394.3, "r": 271.4, "b": 402.4, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 51, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 246.7, "r_y0": 402.4, "r_x1": 271.4, "r_y1": 402.4, "r_x2": 271.4, "r_y2": 394.3, "r_x3": 246.7, "r_y3": 394.3, "coord_origin": "TOPLEFT" }, "text": "OTSL", "orig": "OTSL", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 41, "label": "text", "bbox": { "l": 289.0, "t": 394.3, "r": 310.0, "b": 402.4, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 52, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 289.0, "r_y0": 402.4, "r_x1": 310.0, "r_y1": 402.4, "r_x2": 310.0, "r_y2": 394.3, "r_x3": 289.0, "r_y3": 394.3, "coord_origin": "TOPLEFT" }, "text": "0.938", "orig": "0.938", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 42, "label": "text", "bbox": { "l": 326.7, "t": 394.3, "r": 347.7, "b": 402.4, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 53, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 326.7, "r_y0": 402.4, "r_x1": 347.7, "r_y1": 402.4, "r_x2": 347.7, "r_y2": 394.3, "r_x3": 326.7, "r_y3": 394.3, "coord_origin": "TOPLEFT" }, "text": "0.904", "orig": "0.904", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 43, "label": "text", "bbox": { "l": 363.7, "t": 394.3, "r": 384.7, "b": 402.4, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 54, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 363.7, "r_y0": 402.4, "r_x1": 384.7, "r_y1": 402.4, "r_x2": 384.7, "r_y2": 394.3, "r_x3": 363.7, "r_y3": 394.3, "coord_origin": "TOPLEFT" }, "text": "0.927", "orig": "0.927", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 44, "label": "text", "bbox": { "l": 394.6, "t": 394.3, "r": 418.8, "b": 402.2, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 55, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 394.6, "r_y0": 402.2, "r_x1": 418.8, "r_y1": 402.2, "r_x2": 418.8, "r_y2": 394.3, "r_x3": 394.6, "r_y3": 394.3, "coord_origin": "TOPLEFT" }, "text": "0.853", "orig": "0.853", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 45, "label": "text", "bbox": { "l": 439.5, "t": 394.3, "r": 458.4, "b": 402.2, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 56, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 439.5, "r_y0": 402.2, "r_x1": 458.4, "r_y1": 402.2, "r_x2": 458.4, "r_y2": 394.3, "r_x3": 439.5, "r_y3": 394.3, "coord_origin": "TOPLEFT" }, "text": "1.97", "orig": "1.97", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 46, "label": "text", "bbox": { "l": 245.2, "t": 407.3, "r": 272.9, "b": 415.4, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 57, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 245.2, "r_y0": 415.4, "r_x1": 272.9, "r_y1": 415.4, "r_x2": 272.9, "r_y2": 407.3, "r_x3": 245.2, "r_y3": 407.3, "coord_origin": "TOPLEFT" }, "text": "HTML", "orig": "HTML", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 47, "label": "text", "bbox": { "l": 289.0, "t": 407.3, "r": 310.0, "b": 415.4, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 58, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 289.0, "r_y0": 415.4, "r_x1": 310.0, "r_y1": 415.4, "r_x2": 310.0, "r_y2": 407.3, "r_x3": 289.0, "r_y3": 407.3, "coord_origin": "TOPLEFT" }, "text": "0.952", "orig": "0.952", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 48, "label": "text", "bbox": { "l": 326.7, "t": 407.3, "r": 347.7, "b": 415.4, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 59, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 326.7, "r_y0": 415.4, "r_x1": 347.7, "r_y1": 415.4, "r_x2": 347.7, "r_y2": 407.3, "r_x3": 326.7, "r_y3": 407.3, "coord_origin": "TOPLEFT" }, "text": "0.909", "orig": "0.909", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 49, "label": "text", "bbox": { "l": 362.1, "t": 407.2, "r": 386.2, "b": 415.2, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 60, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 362.1, "r_y0": 415.2, "r_x1": 386.2, "r_y1": 415.2, "r_x2": 386.2, "r_y2": 407.2, "r_x3": 362.1, "r_y3": 407.2, "coord_origin": "TOPLEFT" }, "text": "0.938", "orig": "0.938", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 50, "label": "text", "bbox": { "l": 396.2, "t": 407.3, "r": 417.2, "b": 415.4, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 61, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 396.2, "r_y0": 415.4, "r_x1": 417.2, "r_y1": 415.4, "r_x2": 417.2, "r_y2": 407.3, "r_x3": 396.2, "r_y3": 407.3, "coord_origin": "TOPLEFT" }, "text": "0.843", "orig": "0.843", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 51, "label": "text", "bbox": { "l": 440.8, "t": 407.3, "r": 457.1, "b": 415.4, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 62, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 440.8, "r_y0": 415.4, "r_x1": 457.1, "r_y1": 415.4, "r_x2": 457.1, "r_y2": 407.3, "r_x3": 440.8, "r_y3": 407.3, "coord_origin": "TOPLEFT" }, "text": "3.77", "orig": "3.77", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 52, "label": "text", "bbox": { "l": 161.9, "t": 426.1, "r": 166.5, "b": 434.2, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 63, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 161.9, "r_y0": 434.2, "r_x1": 166.5, "r_y1": 434.2, "r_x2": 166.5, "r_y2": 426.1, "r_x3": 161.9, "r_y3": 426.1, "coord_origin": "TOPLEFT" }, "text": "2", "orig": "2", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 53, "label": "text", "bbox": { "l": 209.5, "t": 426.1, "r": 214.1, "b": 434.2, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 64, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 209.5, "r_y0": 434.2, "r_x1": 214.1, "r_y1": 434.2, "r_x2": 214.1, "r_y2": 426.1, "r_x3": 209.5, "r_y3": 426.1, "coord_origin": "TOPLEFT" }, "text": "4", "orig": "4", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 54, "label": "text", "bbox": { "l": 246.7, "t": 420.6, "r": 271.4, "b": 428.7, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 65, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 246.7, "r_y0": 428.7, "r_x1": 271.4, "r_y1": 428.7, "r_x2": 271.4, "r_y2": 420.6, "r_x3": 246.7, "r_y3": 420.6, "coord_origin": "TOPLEFT" }, "text": "OTSL", "orig": "OTSL", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 55, "label": "text", "bbox": { "l": 289.0, "t": 420.6, "r": 310.0, "b": 428.7, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 66, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 289.0, "r_y0": 428.7, "r_x1": 310.0, "r_y1": 428.7, "r_x2": 310.0, "r_y2": 420.6, "r_x3": 289.0, "r_y3": 420.6, "coord_origin": "TOPLEFT" }, "text": "0.923", "orig": "0.923", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 56, "label": "text", "bbox": { "l": 326.7, "t": 420.6, "r": 347.7, "b": 428.7, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 67, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 326.7, "r_y0": 428.7, "r_x1": 347.7, "r_y1": 428.7, "r_x2": 347.7, "r_y2": 420.6, "r_x3": 326.7, "r_y3": 420.6, "coord_origin": "TOPLEFT" }, "text": "0.897", "orig": "0.897", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 57, "label": "text", "bbox": { "l": 363.7, "t": 420.6, "r": 384.7, "b": 428.7, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 68, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 363.7, "r_y0": 428.7, "r_x1": 384.7, "r_y1": 428.7, "r_x2": 384.7, "r_y2": 420.6, "r_x3": 363.7, "r_y3": 420.6, "coord_origin": "TOPLEFT" }, "text": "0.915", "orig": "0.915", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 58, "label": "text", "bbox": { "l": 394.6, "t": 420.6, "r": 418.8, "b": 428.5, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 69, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 394.6, "r_y0": 428.5, "r_x1": 418.8, "r_y1": 428.5, "r_x2": 418.8, "r_y2": 420.6, "r_x3": 394.6, "r_y3": 420.6, "coord_origin": "TOPLEFT" }, "text": "0.859", "orig": "0.859", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 59, "label": "text", "bbox": { "l": 439.5, "t": 420.6, "r": 458.4, "b": 428.5, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 70, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 439.5, "r_y0": 428.5, "r_x1": 458.4, "r_y1": 428.5, "r_x2": 458.4, "r_y2": 420.6, "r_x3": 439.5, "r_y3": 420.6, "coord_origin": "TOPLEFT" }, "text": "1.91", "orig": "1.91", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 60, "label": "text", "bbox": { "l": 245.2, "t": 433.6, "r": 272.9, "b": 441.7, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 71, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 245.2, "r_y0": 441.7, "r_x1": 272.9, "r_y1": 441.7, "r_x2": 272.9, "r_y2": 433.6, "r_x3": 245.2, "r_y3": 433.6, "coord_origin": "TOPLEFT" }, "text": "HTML", "orig": "HTML", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 61, "label": "text", "bbox": { "l": 289.0, "t": 433.6, "r": 310.0, "b": 441.7, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 72, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 289.0, "r_y0": 441.7, "r_x1": 310.0, "r_y1": 441.7, "r_x2": 310.0, "r_y2": 433.6, "r_x3": 289.0, "r_y3": 433.6, "coord_origin": "TOPLEFT" }, "text": "0.945", "orig": "0.945", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 62, "label": "text", "bbox": { "l": 326.7, "t": 433.6, "r": 347.7, "b": 441.7, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 73, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 326.7, "r_y0": 441.7, "r_x1": 347.7, "r_y1": 441.7, "r_x2": 347.7, "r_y2": 433.6, "r_x3": 326.7, "r_y3": 433.6, "coord_origin": "TOPLEFT" }, "text": "0.901", "orig": "0.901", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 63, "label": "text", "bbox": { "l": 362.1, "t": 433.5, "r": 386.2, "b": 441.5, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 74, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 362.1, "r_y0": 441.5, "r_x1": 386.2, "r_y1": 441.5, "r_x2": 386.2, "r_y2": 433.5, "r_x3": 362.1, "r_y3": 433.5, "coord_origin": "TOPLEFT" }, "text": "0.931", "orig": "0.931", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 64, "label": "text", "bbox": { "l": 396.2, "t": 433.6, "r": 417.2, "b": 441.7, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 75, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 396.2, "r_y0": 441.7, "r_x1": 417.2, "r_y1": 441.7, "r_x2": 417.2, "r_y2": 433.6, "r_x3": 396.2, "r_y3": 433.6, "coord_origin": "TOPLEFT" }, "text": "0.834", "orig": "0.834", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 65, "label": "text", "bbox": { "l": 440.8, "t": 433.6, "r": 457.1, "b": 441.7, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 76, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 440.8, "r_y0": 441.7, "r_x1": 457.1, "r_y1": 441.7, "r_x2": 457.1, "r_y2": 433.6, "r_x3": 440.8, "r_y3": 433.6, "coord_origin": "TOPLEFT" }, "text": "3.81", "orig": "3.81", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 66, "label": "text", "bbox": { "l": 161.9, "t": 452.4, "r": 166.5, "b": 460.5, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 77, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 161.9, "r_y0": 460.5, "r_x1": 166.5, "r_y1": 460.5, "r_x2": 166.5, "r_y2": 452.4, "r_x3": 161.9, "r_y3": 452.4, "coord_origin": "TOPLEFT" }, "text": "4", "orig": "4", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 67, "label": "text", "bbox": { "l": 209.5, "t": 452.4, "r": 214.1, "b": 460.5, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 78, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 209.5, "r_y0": 460.5, "r_x1": 214.1, "r_y1": 460.5, "r_x2": 214.1, "r_y2": 452.4, "r_x3": 209.5, "r_y3": 452.4, "coord_origin": "TOPLEFT" }, "text": "2", "orig": "2", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 68, "label": "text", "bbox": { "l": 246.7, "t": 446.9, "r": 271.4, "b": 455.0, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 79, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 246.7, "r_y0": 455.0, "r_x1": 271.4, "r_y1": 455.0, "r_x2": 271.4, "r_y2": 446.9, "r_x3": 246.7, "r_y3": 446.9, "coord_origin": "TOPLEFT" }, "text": "OTSL", "orig": "OTSL", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 69, "label": "text", "bbox": { "l": 289.0, "t": 446.9, "r": 310.0, "b": 455.0, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 80, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 289.0, "r_y0": 455.0, "r_x1": 310.0, "r_y1": 455.0, "r_x2": 310.0, "r_y2": 446.9, "r_x3": 289.0, "r_y3": 446.9, "coord_origin": "TOPLEFT" }, "text": "0.952", "orig": "0.952", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 70, "label": "text", "bbox": { "l": 329.0, "t": 446.9, "r": 345.4, "b": 455.0, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 81, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 329.0, "r_y0": 455.0, "r_x1": 345.4, "r_y1": 455.0, "r_x2": 345.4, "r_y2": 446.9, "r_x3": 329.0, "r_y3": 446.9, "coord_origin": "TOPLEFT" }, "text": "0.92", "orig": "0.92", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 71, "label": "text", "bbox": { "l": 362.1, "t": 446.9, "r": 386.2, "b": 454.8, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 82, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 362.1, "r_y0": 454.8, "r_x1": 386.2, "r_y1": 454.8, "r_x2": 386.2, "r_y2": 446.9, "r_x3": 362.1, "r_y3": 446.9, "coord_origin": "TOPLEFT" }, "text": "0.942", "orig": "0.942", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 72, "label": "text", "bbox": { "l": 394.6, "t": 446.9, "r": 418.8, "b": 454.8, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 83, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 394.6, "r_y0": 454.8, "r_x1": 418.8, "r_y1": 454.8, "r_x2": 418.8, "r_y2": 446.9, "r_x3": 394.6, "r_y3": 446.9, "coord_origin": "TOPLEFT" }, "text": "0.857", "orig": "0.857", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 73, "label": "text", "bbox": { "l": 439.5, "t": 446.9, "r": 458.4, "b": 454.8, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 84, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 439.5, "r_y0": 454.8, "r_x1": 458.4, "r_y1": 454.8, "r_x2": 458.4, "r_y2": 446.9, "r_x3": 439.5, "r_y3": 446.9, "coord_origin": "TOPLEFT" }, "text": "1.22", "orig": "1.22", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 74, "label": "text", "bbox": { "l": 245.2, "t": 459.9, "r": 272.9, "b": 468.0, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 85, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 245.2, "r_y0": 468.0, "r_x1": 272.9, "r_y1": 468.0, "r_x2": 272.9, "r_y2": 459.9, "r_x3": 245.2, "r_y3": 459.9, "coord_origin": "TOPLEFT" }, "text": "HTML", "orig": "HTML", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 75, "label": "text", "bbox": { "l": 289.0, "t": 459.9, "r": 310.0, "b": 468.0, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 86, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 289.0, "r_y0": 468.0, "r_x1": 310.0, "r_y1": 468.0, "r_x2": 310.0, "r_y2": 459.9, "r_x3": 289.0, "r_y3": 459.9, "coord_origin": "TOPLEFT" }, "text": "0.944", "orig": "0.944", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 76, "label": "text", "bbox": { "l": 326.7, "t": 459.9, "r": 347.7, "b": 468.0, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 87, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 326.7, "r_y0": 468.0, "r_x1": 347.7, "r_y1": 468.0, "r_x2": 347.7, "r_y2": 459.9, "r_x3": 326.7, "r_y3": 459.9, "coord_origin": "TOPLEFT" }, "text": "0.903", "orig": "0.903", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 77, "label": "text", "bbox": { "l": 363.7, "t": 459.9, "r": 384.7, "b": 468.0, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 88, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 363.7, "r_y0": 468.0, "r_x1": 384.7, "r_y1": 468.0, "r_x2": 384.7, "r_y2": 459.9, "r_x3": 363.7, "r_y3": 459.9, "coord_origin": "TOPLEFT" }, "text": "0.931", "orig": "0.931", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 78, "label": "text", "bbox": { "l": 396.2, "t": 459.9, "r": 417.2, "b": 468.0, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 89, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 396.2, "r_y0": 468.0, "r_x1": 417.2, "r_y1": 468.0, "r_x2": 417.2, "r_y2": 459.9, "r_x3": 396.2, "r_y3": 459.9, "coord_origin": "TOPLEFT" }, "text": "0.824", "orig": "0.824", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 79, "label": "text", "bbox": { "l": 446.7, "t": 459.9, "r": 451.3, "b": 468.0, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 90, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 446.7, "r_y0": 468.0, "r_x1": 451.3, "r_y1": 468.0, "r_x2": 451.3, "r_y2": 459.9, "r_x3": 446.7, "r_y3": 459.9, "coord_origin": "TOPLEFT" }, "text": "2", "orig": "2", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] } ] }, { "id": 5, "label": "section_header", "bbox": { "l": 134.8, "t": 508.2, "r": 264.4, "b": 517.0, "coord_origin": "TOPLEFT" }, "confidence": 0.96, "cells": [ { "index": 91, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 134.8, "r_y0": 517.0, "r_x1": 149.4, "r_y1": 517.0, "r_x2": 149.4, "r_y2": 508.2, "r_x3": 134.8, "r_y3": 508.2, "coord_origin": "TOPLEFT" }, "text": "5.2", "orig": "5.2", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 92, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 160.9, "r_y0": 517.0, "r_x1": 264.4, "r_y1": 517.0, "r_x2": 264.4, "r_y2": 508.2, "r_x3": 160.9, "r_y3": 508.2, "coord_origin": "TOPLEFT" }, "text": "Quantitative Results", "orig": "Quantitative Results", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 1, "label": "text", "bbox": { "l": 134.8, "t": 524.6, "r": 480.6, "b": 617.0, "coord_origin": "TOPLEFT" }, "confidence": 0.99, "cells": [ { "index": 93, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 134.8, "r_y0": 533.3, "r_x1": 480.6, "r_y1": 533.3, "r_x2": 480.6, "r_y2": 524.6, "r_x3": 134.8, "r_y3": 524.6, "coord_origin": "TOPLEFT" }, "text": "We picked the model parameter configuration that produced the best prediction", "orig": "We picked the model parameter configuration that produced the best prediction", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 94, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 134.8, "r_y0": 545.3, "r_x1": 480.6, "r_y1": 545.3, "r_x2": 480.6, "r_y2": 536.5, "r_x3": 134.8, "r_y3": 536.5, "coord_origin": "TOPLEFT" }, "text": "quality (enc=6, dec=6, heads=8) with PubTabNet alone, then independently", "orig": "quality (enc=6, dec=6, heads=8) with PubTabNet alone, then independently", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 95, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 134.8, "r_y0": 557.3, "r_x1": 480.6, "r_y1": 557.3, "r_x2": 480.6, "r_y2": 548.5, "r_x3": 134.8, "r_y3": 548.5, "coord_origin": "TOPLEFT" }, "text": "trained and evaluated it on three publicly available data sets: PubTabNet (395k", "orig": "trained and evaluated it on three publicly available data sets: PubTabNet (395k", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 96, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 134.8, "r_y0": 569.2, "r_x1": 480.6, "r_y1": 569.2, "r_x2": 480.6, "r_y2": 560.4, "r_x3": 134.8, "r_y3": 560.4, "coord_origin": "TOPLEFT" }, "text": "samples), FinTabNet (113k samples) and PubTables-1M (about 1M samples).", "orig": "samples), FinTabNet (113k samples) and PubTables-1M (about 1M samples).", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 97, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 134.8, "r_y0": 581.2, "r_x1": 480.6, "r_y1": 581.2, "r_x2": 480.6, "r_y2": 572.4, "r_x3": 134.8, "r_y3": 572.4, "coord_origin": "TOPLEFT" }, "text": "Performance results are presented in Table. 2. It is clearly evident that the model", "orig": "Performance results are presented in Table. 2. It is clearly evident that the model", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 98, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 134.8, "r_y0": 593.1, "r_x1": 480.6, "r_y1": 593.1, "r_x2": 480.6, "r_y2": 584.3, "r_x3": 134.8, "r_y3": 584.3, "coord_origin": "TOPLEFT" }, "text": "trained on OTSL outperforms HTML across the board, keeping high TEDs and", "orig": "trained on OTSL outperforms HTML across the board, keeping high TEDs and", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 99, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 134.8, "r_y0": 605.1, "r_x1": 480.6, "r_y1": 605.1, "r_x2": 480.6, "r_y2": 596.3, "r_x3": 134.8, "r_y3": 596.3, "coord_origin": "TOPLEFT" }, "text": "mAP scores even on difficult financial tables (FinTabNet) that contain sparse", "orig": "mAP scores even on difficult financial tables (FinTabNet) that contain sparse", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 100, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 134.8, "r_y0": 617.0, "r_x1": 206.8, "r_y1": 617.0, "r_x2": 206.8, "r_y2": 608.2, "r_x3": 134.8, "r_y3": 608.2, "coord_origin": "TOPLEFT" }, "text": "and large tables.", "orig": "and large tables.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 2, "label": "text", "bbox": { "l": 134.8, "t": 620.2, "r": 480.6, "b": 664.9, "coord_origin": "TOPLEFT" }, "confidence": 0.99, "cells": [ { "index": 101, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 149.7, "r_y0": 629.0, "r_x1": 480.6, "r_y1": 629.0, "r_x2": 480.6, "r_y2": 620.2, "r_x3": 149.7, "r_y3": 620.2, "coord_origin": "TOPLEFT" }, "text": "Additionally, the results show that OTSL has an advantage over HTML", "orig": "Additionally, the results show that OTSL has an advantage over HTML", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 102, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 134.8, "r_y0": 640.9, "r_x1": 480.6, "r_y1": 640.9, "r_x2": 480.6, "r_y2": 632.1, "r_x3": 134.8, "r_y3": 632.1, "coord_origin": "TOPLEFT" }, "text": "when applied on a bigger data set like PubTables-1M and achieves significantly", "orig": "when applied on a bigger data set like PubTables-1M and achieves significantly", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 103, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 134.8, "r_y0": 652.9, "r_x1": 480.6, "r_y1": 652.9, "r_x2": 480.6, "r_y2": 644.1, "r_x3": 134.8, "r_y3": 644.1, "coord_origin": "TOPLEFT" }, "text": "improved scores. Finally, OTSL achieves faster inference due to fewer decoding", "orig": "improved scores. Finally, OTSL achieves faster inference due to fewer decoding", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 104, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 134.8, "r_y0": 664.9, "r_x1": 405.8, "r_y1": 664.9, "r_x2": 405.8, "r_y2": 656.1, "r_x3": 134.8, "r_y3": 656.1, "coord_origin": "TOPLEFT" }, "text": "steps which is a result of the reduced sequence representation.", "orig": "steps which is a result of the reduced sequence representation.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] } ] }, "tablestructure": { "table_map": { "0": { "label": "table", "id": 0, "page_no": 8, "cluster": { "id": 0, "label": "table", "bbox": { "l": 139.7, "t": 337.6, "r": 475.0, "b": 469.5, "coord_origin": "TOPLEFT" }, "confidence": 0.99, "cells": [ { "index": 22, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 160.4, "r_y0": 349.8, "r_x1": 168.0, "r_y1": 349.8, "r_x2": 168.0, "r_y2": 341.7, "r_x3": 160.4, "r_y3": 341.7, "coord_origin": "TOPLEFT" }, "text": "#", "orig": "#", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 23, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 144.6, "r_y0": 362.8, "r_x1": 183.8, "r_y1": 362.8, "r_x2": 183.8, "r_y2": 354.7, "r_x3": 144.6, "r_y3": 354.7, "coord_origin": "TOPLEFT" }, "text": "enc-layers", "orig": "enc-layers", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 24, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 208.0, "r_y0": 349.8, "r_x1": 215.7, "r_y1": 349.8, "r_x2": 215.7, "r_y2": 341.7, "r_x3": 208.0, "r_y3": 341.7, "coord_origin": "TOPLEFT" }, "text": "#", "orig": "#", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 25, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 192.2, "r_y0": 362.8, "r_x1": 231.4, "r_y1": 362.8, "r_x2": 231.4, "r_y2": 354.7, "r_x3": 192.2, "r_y3": 354.7, "coord_origin": "TOPLEFT" }, "text": "dec-layers", "orig": "dec-layers", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 26, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 239.8, "r_y0": 355.3, "r_x1": 278.3, "r_y1": 355.3, "r_x2": 278.3, "r_y2": 347.2, "r_x3": 239.8, "r_y3": 347.2, "coord_origin": "TOPLEFT" }, "text": "Language", "orig": "Language", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 27, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 324.7, "r_y0": 349.8, "r_x1": 348.3, "r_y1": 349.8, "r_x2": 348.3, "r_y2": 341.7, "r_x3": 324.7, "r_y3": 341.7, "coord_origin": "TOPLEFT" }, "text": "TEDs", "orig": "TEDs", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 28, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 396.3, "r_y0": 349.8, "r_x1": 417.1, "r_y1": 349.8, "r_x2": 417.1, "r_y2": 341.7, "r_x3": 396.3, "r_y3": 341.7, "coord_origin": "TOPLEFT" }, "text": "mAP", "orig": "mAP", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 29, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 394.9, "r_y0": 360.8, "r_x1": 418.5, "r_y1": 360.8, "r_x2": 418.5, "r_y2": 352.7, "r_x3": 394.9, "r_y3": 352.7, "coord_origin": "TOPLEFT" }, "text": "(0.75)", "orig": "(0.75)", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 30, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 430.8, "r_y0": 349.8, "r_x1": 467.1, "r_y1": 349.8, "r_x2": 467.1, "r_y2": 341.7, "r_x3": 430.8, "r_y3": 341.7, "coord_origin": "TOPLEFT" }, "text": "Inference", "orig": "Inference", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 31, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 427.1, "r_y0": 360.8, "r_x1": 470.8, "r_y1": 360.8, "r_x2": 470.8, "r_y2": 352.7, "r_x3": 427.1, "r_y3": 352.7, "coord_origin": "TOPLEFT" }, "text": "time (secs)", "orig": "time (secs)", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 32, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 286.7, "r_y0": 362.8, "r_x1": 312.3, "r_y1": 362.8, "r_x2": 312.3, "r_y2": 354.7, "r_x3": 286.7, "r_y3": 354.7, "coord_origin": "TOPLEFT" }, "text": "simple", "orig": "simple", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 33, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 320.7, "r_y0": 362.8, "r_x1": 353.7, "r_y1": 362.8, "r_x2": 353.7, "r_y2": 354.7, "r_x3": 320.7, "r_y3": 354.7, "coord_origin": "TOPLEFT" }, "text": "complex", "orig": "complex", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 34, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 369.3, "r_y0": 362.8, "r_x1": 379.0, "r_y1": 362.8, "r_x2": 379.0, "r_y2": 354.7, "r_x3": 369.3, "r_y3": 354.7, "coord_origin": "TOPLEFT" }, "text": "all", "orig": "all", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 35, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 161.9, "r_y0": 381.6, "r_x1": 166.5, "r_y1": 381.6, "r_x2": 166.5, "r_y2": 373.5, "r_x3": 161.9, "r_y3": 373.5, "coord_origin": "TOPLEFT" }, "text": "6", "orig": "6", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 36, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 209.5, "r_y0": 381.6, "r_x1": 214.1, "r_y1": 381.6, "r_x2": 214.1, "r_y2": 373.5, "r_x3": 209.5, "r_y3": 373.5, "coord_origin": "TOPLEFT" }, "text": "6", "orig": "6", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 37, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 246.7, "r_y0": 376.1, "r_x1": 271.4, "r_y1": 376.1, "r_x2": 271.4, "r_y2": 368.0, "r_x3": 246.7, "r_y3": 368.0, "coord_origin": "TOPLEFT" }, "text": "OTSL", "orig": "OTSL", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 38, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 289.0, "r_y0": 376.1, "r_x1": 310.0, "r_y1": 376.1, "r_x2": 310.0, "r_y2": 368.0, "r_x3": 289.0, "r_y3": 368.0, "coord_origin": "TOPLEFT" }, "text": "0.965", "orig": "0.965", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 39, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 326.7, "r_y0": 376.1, "r_x1": 347.7, "r_y1": 376.1, "r_x2": 347.7, "r_y2": 368.0, "r_x3": 326.7, "r_y3": 368.0, "coord_origin": "TOPLEFT" }, "text": "0.934", "orig": "0.934", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 40, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 363.7, "r_y0": 376.1, "r_x1": 384.7, "r_y1": 376.1, "r_x2": 384.7, "r_y2": 368.0, "r_x3": 363.7, "r_y3": 368.0, "coord_origin": "TOPLEFT" }, "text": "0.955", "orig": "0.955", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 41, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 397.3, "r_y0": 375.9, "r_x1": 416.1, "r_y1": 375.9, "r_x2": 416.1, "r_y2": 368.0, "r_x3": 397.3, "r_y3": 368.0, "coord_origin": "TOPLEFT" }, "text": "0.88", "orig": "0.88", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 42, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 439.5, "r_y0": 375.9, "r_x1": 458.4, "r_y1": 375.9, "r_x2": 458.4, "r_y2": 368.0, "r_x3": 439.5, "r_y3": 368.0, "coord_origin": "TOPLEFT" }, "text": "2.73", "orig": "2.73", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 43, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 245.2, "r_y0": 389.1, "r_x1": 272.9, "r_y1": 389.1, "r_x2": 272.9, "r_y2": 381.0, "r_x3": 245.2, "r_y3": 381.0, "coord_origin": "TOPLEFT" }, "text": "HTML", "orig": "HTML", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 44, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 289.0, "r_y0": 389.1, "r_x1": 310.0, "r_y1": 389.1, "r_x2": 310.0, "r_y2": 381.0, "r_x3": 289.0, "r_y3": 381.0, "coord_origin": "TOPLEFT" }, "text": "0.969", "orig": "0.969", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 45, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 326.7, "r_y0": 389.1, "r_x1": 347.7, "r_y1": 389.1, "r_x2": 347.7, "r_y2": 381.0, "r_x3": 326.7, "r_y3": 381.0, "coord_origin": "TOPLEFT" }, "text": "0.927", "orig": "0.927", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 46, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 363.7, "r_y0": 389.1, "r_x1": 384.7, "r_y1": 389.1, "r_x2": 384.7, "r_y2": 381.0, "r_x3": 363.7, "r_y3": 381.0, "coord_origin": "TOPLEFT" }, "text": "0.955", "orig": "0.955", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 47, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 396.2, "r_y0": 389.1, "r_x1": 417.2, "r_y1": 389.1, "r_x2": 417.2, "r_y2": 381.0, "r_x3": 396.2, "r_y3": 381.0, "coord_origin": "TOPLEFT" }, "text": "0.857", "orig": "0.857", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 48, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 440.8, "r_y0": 389.1, "r_x1": 457.1, "r_y1": 389.1, "r_x2": 457.1, "r_y2": 381.0, "r_x3": 440.8, "r_y3": 381.0, "coord_origin": "TOPLEFT" }, "text": "5.39", "orig": "5.39", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 49, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 161.9, "r_y0": 407.9, "r_x1": 166.5, "r_y1": 407.9, "r_x2": 166.5, "r_y2": 399.8, "r_x3": 161.9, "r_y3": 399.8, "coord_origin": "TOPLEFT" }, "text": "4", "orig": "4", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 50, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 209.5, "r_y0": 407.9, "r_x1": 214.1, "r_y1": 407.9, "r_x2": 214.1, "r_y2": 399.8, "r_x3": 209.5, "r_y3": 399.8, "coord_origin": "TOPLEFT" }, "text": "4", "orig": "4", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 51, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 246.7, "r_y0": 402.4, "r_x1": 271.4, "r_y1": 402.4, "r_x2": 271.4, "r_y2": 394.3, "r_x3": 246.7, "r_y3": 394.3, "coord_origin": "TOPLEFT" }, "text": "OTSL", "orig": "OTSL", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 52, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 289.0, "r_y0": 402.4, "r_x1": 310.0, "r_y1": 402.4, "r_x2": 310.0, "r_y2": 394.3, "r_x3": 289.0, "r_y3": 394.3, "coord_origin": "TOPLEFT" }, "text": "0.938", "orig": "0.938", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 53, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 326.7, "r_y0": 402.4, "r_x1": 347.7, "r_y1": 402.4, "r_x2": 347.7, "r_y2": 394.3, "r_x3": 326.7, "r_y3": 394.3, "coord_origin": "TOPLEFT" }, "text": "0.904", "orig": "0.904", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 54, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 363.7, "r_y0": 402.4, "r_x1": 384.7, "r_y1": 402.4, "r_x2": 384.7, "r_y2": 394.3, "r_x3": 363.7, "r_y3": 394.3, "coord_origin": "TOPLEFT" }, "text": "0.927", "orig": "0.927", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 55, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 394.6, "r_y0": 402.2, "r_x1": 418.8, "r_y1": 402.2, "r_x2": 418.8, "r_y2": 394.3, "r_x3": 394.6, "r_y3": 394.3, "coord_origin": "TOPLEFT" }, "text": "0.853", "orig": "0.853", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 56, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 439.5, "r_y0": 402.2, "r_x1": 458.4, "r_y1": 402.2, "r_x2": 458.4, "r_y2": 394.3, "r_x3": 439.5, "r_y3": 394.3, "coord_origin": "TOPLEFT" }, "text": "1.97", "orig": "1.97", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 57, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 245.2, "r_y0": 415.4, "r_x1": 272.9, "r_y1": 415.4, "r_x2": 272.9, "r_y2": 407.3, "r_x3": 245.2, "r_y3": 407.3, "coord_origin": "TOPLEFT" }, "text": "HTML", "orig": "HTML", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 58, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 289.0, "r_y0": 415.4, "r_x1": 310.0, "r_y1": 415.4, "r_x2": 310.0, "r_y2": 407.3, "r_x3": 289.0, "r_y3": 407.3, "coord_origin": "TOPLEFT" }, "text": "0.952", "orig": "0.952", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 59, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 326.7, "r_y0": 415.4, "r_x1": 347.7, "r_y1": 415.4, "r_x2": 347.7, "r_y2": 407.3, "r_x3": 326.7, "r_y3": 407.3, "coord_origin": "TOPLEFT" }, "text": "0.909", "orig": "0.909", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 60, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 362.1, "r_y0": 415.2, "r_x1": 386.2, "r_y1": 415.2, "r_x2": 386.2, "r_y2": 407.2, "r_x3": 362.1, "r_y3": 407.2, "coord_origin": "TOPLEFT" }, "text": "0.938", "orig": "0.938", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 61, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 396.2, "r_y0": 415.4, "r_x1": 417.2, "r_y1": 415.4, "r_x2": 417.2, "r_y2": 407.3, "r_x3": 396.2, "r_y3": 407.3, "coord_origin": "TOPLEFT" }, "text": "0.843", "orig": "0.843", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 62, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 440.8, "r_y0": 415.4, "r_x1": 457.1, "r_y1": 415.4, "r_x2": 457.1, "r_y2": 407.3, "r_x3": 440.8, "r_y3": 407.3, "coord_origin": "TOPLEFT" }, "text": "3.77", "orig": "3.77", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 63, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 161.9, "r_y0": 434.2, "r_x1": 166.5, "r_y1": 434.2, "r_x2": 166.5, "r_y2": 426.1, "r_x3": 161.9, "r_y3": 426.1, "coord_origin": "TOPLEFT" }, "text": "2", "orig": "2", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 64, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 209.5, "r_y0": 434.2, "r_x1": 214.1, "r_y1": 434.2, "r_x2": 214.1, "r_y2": 426.1, "r_x3": 209.5, "r_y3": 426.1, "coord_origin": "TOPLEFT" }, "text": "4", "orig": "4", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 65, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 246.7, "r_y0": 428.7, "r_x1": 271.4, "r_y1": 428.7, "r_x2": 271.4, "r_y2": 420.6, "r_x3": 246.7, "r_y3": 420.6, "coord_origin": "TOPLEFT" }, "text": "OTSL", "orig": "OTSL", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 66, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 289.0, "r_y0": 428.7, "r_x1": 310.0, "r_y1": 428.7, "r_x2": 310.0, "r_y2": 420.6, "r_x3": 289.0, "r_y3": 420.6, "coord_origin": "TOPLEFT" }, "text": "0.923", "orig": "0.923", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 67, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 326.7, "r_y0": 428.7, "r_x1": 347.7, "r_y1": 428.7, "r_x2": 347.7, "r_y2": 420.6, "r_x3": 326.7, "r_y3": 420.6, "coord_origin": "TOPLEFT" }, "text": "0.897", "orig": "0.897", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 68, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 363.7, "r_y0": 428.7, "r_x1": 384.7, "r_y1": 428.7, "r_x2": 384.7, "r_y2": 420.6, "r_x3": 363.7, "r_y3": 420.6, "coord_origin": "TOPLEFT" }, "text": "0.915", "orig": "0.915", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 69, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 394.6, "r_y0": 428.5, "r_x1": 418.8, "r_y1": 428.5, "r_x2": 418.8, "r_y2": 420.6, "r_x3": 394.6, "r_y3": 420.6, "coord_origin": "TOPLEFT" }, "text": "0.859", "orig": "0.859", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 70, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 439.5, "r_y0": 428.5, "r_x1": 458.4, "r_y1": 428.5, "r_x2": 458.4, "r_y2": 420.6, "r_x3": 439.5, "r_y3": 420.6, "coord_origin": "TOPLEFT" }, "text": "1.91", "orig": "1.91", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 71, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 245.2, "r_y0": 441.7, "r_x1": 272.9, "r_y1": 441.7, "r_x2": 272.9, "r_y2": 433.6, "r_x3": 245.2, "r_y3": 433.6, "coord_origin": "TOPLEFT" }, "text": "HTML", "orig": "HTML", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 72, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 289.0, "r_y0": 441.7, "r_x1": 310.0, "r_y1": 441.7, "r_x2": 310.0, "r_y2": 433.6, "r_x3": 289.0, "r_y3": 433.6, "coord_origin": "TOPLEFT" }, "text": "0.945", "orig": "0.945", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 73, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 326.7, "r_y0": 441.7, "r_x1": 347.7, "r_y1": 441.7, "r_x2": 347.7, "r_y2": 433.6, "r_x3": 326.7, "r_y3": 433.6, "coord_origin": "TOPLEFT" }, "text": "0.901", "orig": "0.901", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 74, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 362.1, "r_y0": 441.5, "r_x1": 386.2, "r_y1": 441.5, "r_x2": 386.2, "r_y2": 433.5, "r_x3": 362.1, "r_y3": 433.5, "coord_origin": "TOPLEFT" }, "text": "0.931", "orig": "0.931", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 75, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 396.2, "r_y0": 441.7, "r_x1": 417.2, "r_y1": 441.7, "r_x2": 417.2, "r_y2": 433.6, "r_x3": 396.2, "r_y3": 433.6, "coord_origin": "TOPLEFT" }, "text": "0.834", "orig": "0.834", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 76, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 440.8, "r_y0": 441.7, "r_x1": 457.1, "r_y1": 441.7, "r_x2": 457.1, "r_y2": 433.6, "r_x3": 440.8, "r_y3": 433.6, "coord_origin": "TOPLEFT" }, "text": "3.81", "orig": "3.81", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 77, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 161.9, "r_y0": 460.5, "r_x1": 166.5, "r_y1": 460.5, "r_x2": 166.5, "r_y2": 452.4, "r_x3": 161.9, "r_y3": 452.4, "coord_origin": "TOPLEFT" }, "text": "4", "orig": "4", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 78, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 209.5, "r_y0": 460.5, "r_x1": 214.1, "r_y1": 460.5, "r_x2": 214.1, "r_y2": 452.4, "r_x3": 209.5, "r_y3": 452.4, "coord_origin": "TOPLEFT" }, "text": "2", "orig": "2", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 79, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 246.7, "r_y0": 455.0, "r_x1": 271.4, "r_y1": 455.0, "r_x2": 271.4, "r_y2": 446.9, "r_x3": 246.7, "r_y3": 446.9, "coord_origin": "TOPLEFT" }, "text": "OTSL", "orig": "OTSL", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 80, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 289.0, "r_y0": 455.0, "r_x1": 310.0, "r_y1": 455.0, "r_x2": 310.0, "r_y2": 446.9, "r_x3": 289.0, "r_y3": 446.9, "coord_origin": "TOPLEFT" }, "text": "0.952", "orig": "0.952", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 81, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 329.0, "r_y0": 455.0, "r_x1": 345.4, "r_y1": 455.0, "r_x2": 345.4, "r_y2": 446.9, "r_x3": 329.0, "r_y3": 446.9, "coord_origin": "TOPLEFT" }, "text": "0.92", "orig": "0.92", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 82, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 362.1, "r_y0": 454.8, "r_x1": 386.2, "r_y1": 454.8, "r_x2": 386.2, "r_y2": 446.9, "r_x3": 362.1, "r_y3": 446.9, "coord_origin": "TOPLEFT" }, "text": "0.942", "orig": "0.942", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 83, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 394.6, "r_y0": 454.8, "r_x1": 418.8, "r_y1": 454.8, "r_x2": 418.8, "r_y2": 446.9, "r_x3": 394.6, "r_y3": 446.9, "coord_origin": "TOPLEFT" }, "text": "0.857", "orig": "0.857", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 84, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 439.5, "r_y0": 454.8, "r_x1": 458.4, "r_y1": 454.8, "r_x2": 458.4, "r_y2": 446.9, "r_x3": 439.5, "r_y3": 446.9, "coord_origin": "TOPLEFT" }, "text": "1.22", "orig": "1.22", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 85, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 245.2, "r_y0": 468.0, "r_x1": 272.9, "r_y1": 468.0, "r_x2": 272.9, "r_y2": 459.9, "r_x3": 245.2, "r_y3": 459.9, "coord_origin": "TOPLEFT" }, "text": "HTML", "orig": "HTML", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 86, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 289.0, "r_y0": 468.0, "r_x1": 310.0, "r_y1": 468.0, "r_x2": 310.0, "r_y2": 459.9, "r_x3": 289.0, "r_y3": 459.9, "coord_origin": "TOPLEFT" }, "text": "0.944", "orig": "0.944", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 87, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 326.7, "r_y0": 468.0, "r_x1": 347.7, "r_y1": 468.0, "r_x2": 347.7, "r_y2": 459.9, "r_x3": 326.7, "r_y3": 459.9, "coord_origin": "TOPLEFT" }, "text": "0.903", "orig": "0.903", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 88, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 363.7, "r_y0": 468.0, "r_x1": 384.7, "r_y1": 468.0, "r_x2": 384.7, "r_y2": 459.9, "r_x3": 363.7, "r_y3": 459.9, "coord_origin": "TOPLEFT" }, "text": "0.931", "orig": "0.931", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 89, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 396.2, "r_y0": 468.0, "r_x1": 417.2, "r_y1": 468.0, "r_x2": 417.2, "r_y2": 459.9, "r_x3": 396.2, "r_y3": 459.9, "coord_origin": "TOPLEFT" }, "text": "0.824", "orig": "0.824", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 90, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 446.7, "r_y0": 468.0, "r_x1": 451.3, "r_y1": 468.0, "r_x2": 451.3, "r_y2": 459.9, "r_x3": 446.7, "r_y3": 459.9, "coord_origin": "TOPLEFT" }, "text": "2", "orig": "2", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [ { "id": 11, "label": "text", "bbox": { "l": 160.4, "t": 341.7, "r": 168.0, "b": 349.8, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 22, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 160.4, "r_y0": 349.8, "r_x1": 168.0, "r_y1": 349.8, "r_x2": 168.0, "r_y2": 341.7, "r_x3": 160.4, "r_y3": 341.7, "coord_origin": "TOPLEFT" }, "text": "#", "orig": "#", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 12, "label": "text", "bbox": { "l": 144.6, "t": 354.7, "r": 183.8, "b": 362.8, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 23, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 144.6, "r_y0": 362.8, "r_x1": 183.8, "r_y1": 362.8, "r_x2": 183.8, "r_y2": 354.7, "r_x3": 144.6, "r_y3": 354.7, "coord_origin": "TOPLEFT" }, "text": "enc-layers", "orig": "enc-layers", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 13, "label": "text", "bbox": { "l": 208.0, "t": 341.7, "r": 215.7, "b": 349.8, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 24, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 208.0, "r_y0": 349.8, "r_x1": 215.7, "r_y1": 349.8, "r_x2": 215.7, "r_y2": 341.7, "r_x3": 208.0, "r_y3": 341.7, "coord_origin": "TOPLEFT" }, "text": "#", "orig": "#", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 14, "label": "text", "bbox": { "l": 192.2, "t": 354.7, "r": 231.4, "b": 362.8, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 25, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 192.2, "r_y0": 362.8, "r_x1": 231.4, "r_y1": 362.8, "r_x2": 231.4, "r_y2": 354.7, "r_x3": 192.2, "r_y3": 354.7, "coord_origin": "TOPLEFT" }, "text": "dec-layers", "orig": "dec-layers", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 15, "label": "text", "bbox": { "l": 239.8, "t": 347.2, "r": 278.3, "b": 355.3, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 26, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 239.8, "r_y0": 355.3, "r_x1": 278.3, "r_y1": 355.3, "r_x2": 278.3, "r_y2": 347.2, "r_x3": 239.8, "r_y3": 347.2, "coord_origin": "TOPLEFT" }, "text": "Language", "orig": "Language", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 16, "label": "text", "bbox": { "l": 324.7, "t": 341.7, "r": 348.3, "b": 349.8, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 27, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 324.7, "r_y0": 349.8, "r_x1": 348.3, "r_y1": 349.8, "r_x2": 348.3, "r_y2": 341.7, "r_x3": 324.7, "r_y3": 341.7, "coord_origin": "TOPLEFT" }, "text": "TEDs", "orig": "TEDs", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 17, "label": "text", "bbox": { "l": 396.3, "t": 341.7, "r": 417.1, "b": 349.8, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 28, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 396.3, "r_y0": 349.8, "r_x1": 417.1, "r_y1": 349.8, "r_x2": 417.1, "r_y2": 341.7, "r_x3": 396.3, "r_y3": 341.7, "coord_origin": "TOPLEFT" }, "text": "mAP", "orig": "mAP", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 18, "label": "text", "bbox": { "l": 394.9, "t": 352.7, "r": 418.5, "b": 360.8, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 29, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 394.9, "r_y0": 360.8, "r_x1": 418.5, "r_y1": 360.8, "r_x2": 418.5, "r_y2": 352.7, "r_x3": 394.9, "r_y3": 352.7, "coord_origin": "TOPLEFT" }, "text": "(0.75)", "orig": "(0.75)", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 19, "label": "text", "bbox": { "l": 430.8, "t": 341.7, "r": 467.1, "b": 349.8, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 30, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 430.8, "r_y0": 349.8, "r_x1": 467.1, "r_y1": 349.8, "r_x2": 467.1, "r_y2": 341.7, "r_x3": 430.8, "r_y3": 341.7, "coord_origin": "TOPLEFT" }, "text": "Inference", "orig": "Inference", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 20, "label": "text", "bbox": { "l": 427.1, "t": 352.7, "r": 470.8, "b": 360.8, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 31, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 427.1, "r_y0": 360.8, "r_x1": 470.8, "r_y1": 360.8, "r_x2": 470.8, "r_y2": 352.7, "r_x3": 427.1, "r_y3": 352.7, "coord_origin": "TOPLEFT" }, "text": "time (secs)", "orig": "time (secs)", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 21, "label": "text", "bbox": { "l": 286.7, "t": 354.7, "r": 312.3, "b": 362.8, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 32, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 286.7, "r_y0": 362.8, "r_x1": 312.3, "r_y1": 362.8, "r_x2": 312.3, "r_y2": 354.7, "r_x3": 286.7, "r_y3": 354.7, "coord_origin": "TOPLEFT" }, "text": "simple", "orig": "simple", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 22, "label": "text", "bbox": { "l": 320.7, "t": 354.7, "r": 353.7, "b": 362.8, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 33, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 320.7, "r_y0": 362.8, "r_x1": 353.7, "r_y1": 362.8, "r_x2": 353.7, "r_y2": 354.7, "r_x3": 320.7, "r_y3": 354.7, "coord_origin": "TOPLEFT" }, "text": "complex", "orig": "complex", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 23, "label": "text", "bbox": { "l": 369.3, "t": 354.7, "r": 379.0, "b": 362.8, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 34, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 369.3, "r_y0": 362.8, "r_x1": 379.0, "r_y1": 362.8, "r_x2": 379.0, "r_y2": 354.7, "r_x3": 369.3, "r_y3": 354.7, "coord_origin": "TOPLEFT" }, "text": "all", "orig": "all", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 24, "label": "text", "bbox": { "l": 161.9, "t": 373.5, "r": 166.5, "b": 381.6, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 35, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 161.9, "r_y0": 381.6, "r_x1": 166.5, "r_y1": 381.6, "r_x2": 166.5, "r_y2": 373.5, "r_x3": 161.9, "r_y3": 373.5, "coord_origin": "TOPLEFT" }, "text": "6", "orig": "6", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 25, "label": "text", "bbox": { "l": 209.5, "t": 373.5, "r": 214.1, "b": 381.6, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 36, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 209.5, "r_y0": 381.6, "r_x1": 214.1, "r_y1": 381.6, "r_x2": 214.1, "r_y2": 373.5, "r_x3": 209.5, "r_y3": 373.5, "coord_origin": "TOPLEFT" }, "text": "6", "orig": "6", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 26, "label": "text", "bbox": { "l": 246.7, "t": 368.0, "r": 271.4, "b": 376.1, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 37, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 246.7, "r_y0": 376.1, "r_x1": 271.4, "r_y1": 376.1, "r_x2": 271.4, "r_y2": 368.0, "r_x3": 246.7, "r_y3": 368.0, "coord_origin": "TOPLEFT" }, "text": "OTSL", "orig": "OTSL", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 27, "label": "text", "bbox": { "l": 289.0, "t": 368.0, "r": 310.0, "b": 376.1, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 38, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 289.0, "r_y0": 376.1, "r_x1": 310.0, "r_y1": 376.1, "r_x2": 310.0, "r_y2": 368.0, "r_x3": 289.0, "r_y3": 368.0, "coord_origin": "TOPLEFT" }, "text": "0.965", "orig": "0.965", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 28, "label": "text", "bbox": { "l": 326.7, "t": 368.0, "r": 347.7, "b": 376.1, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 39, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 326.7, "r_y0": 376.1, "r_x1": 347.7, "r_y1": 376.1, "r_x2": 347.7, "r_y2": 368.0, "r_x3": 326.7, "r_y3": 368.0, "coord_origin": "TOPLEFT" }, "text": "0.934", "orig": "0.934", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 29, "label": "text", "bbox": { "l": 363.7, "t": 368.0, "r": 384.7, "b": 376.1, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 40, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 363.7, "r_y0": 376.1, "r_x1": 384.7, "r_y1": 376.1, "r_x2": 384.7, "r_y2": 368.0, "r_x3": 363.7, "r_y3": 368.0, "coord_origin": "TOPLEFT" }, "text": "0.955", "orig": "0.955", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 30, "label": "text", "bbox": { "l": 397.3, "t": 368.0, "r": 416.1, "b": 375.9, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 41, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 397.3, "r_y0": 375.9, "r_x1": 416.1, "r_y1": 375.9, "r_x2": 416.1, "r_y2": 368.0, "r_x3": 397.3, "r_y3": 368.0, "coord_origin": "TOPLEFT" }, "text": "0.88", "orig": "0.88", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 31, "label": "text", "bbox": { "l": 439.5, "t": 368.0, "r": 458.4, "b": 375.9, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 42, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 439.5, "r_y0": 375.9, "r_x1": 458.4, "r_y1": 375.9, "r_x2": 458.4, "r_y2": 368.0, "r_x3": 439.5, "r_y3": 368.0, "coord_origin": "TOPLEFT" }, "text": "2.73", "orig": "2.73", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 32, "label": "text", "bbox": { "l": 245.2, "t": 381.0, "r": 272.9, "b": 389.1, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 43, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 245.2, "r_y0": 389.1, "r_x1": 272.9, "r_y1": 389.1, "r_x2": 272.9, "r_y2": 381.0, "r_x3": 245.2, "r_y3": 381.0, "coord_origin": "TOPLEFT" }, "text": "HTML", "orig": "HTML", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 33, "label": "text", "bbox": { "l": 289.0, "t": 381.0, "r": 310.0, "b": 389.1, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 44, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 289.0, "r_y0": 389.1, "r_x1": 310.0, "r_y1": 389.1, "r_x2": 310.0, "r_y2": 381.0, "r_x3": 289.0, "r_y3": 381.0, "coord_origin": "TOPLEFT" }, "text": "0.969", "orig": "0.969", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 34, "label": "text", "bbox": { "l": 326.7, "t": 381.0, "r": 347.7, "b": 389.1, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 45, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 326.7, "r_y0": 389.1, "r_x1": 347.7, "r_y1": 389.1, "r_x2": 347.7, "r_y2": 381.0, "r_x3": 326.7, "r_y3": 381.0, "coord_origin": "TOPLEFT" }, "text": "0.927", "orig": "0.927", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 35, "label": "text", "bbox": { "l": 363.7, "t": 381.0, "r": 384.7, "b": 389.1, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 46, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 363.7, "r_y0": 389.1, "r_x1": 384.7, "r_y1": 389.1, "r_x2": 384.7, "r_y2": 381.0, "r_x3": 363.7, "r_y3": 381.0, "coord_origin": "TOPLEFT" }, "text": "0.955", "orig": "0.955", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 36, "label": "text", "bbox": { "l": 396.2, "t": 381.0, "r": 417.2, "b": 389.1, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 47, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 396.2, "r_y0": 389.1, "r_x1": 417.2, "r_y1": 389.1, "r_x2": 417.2, "r_y2": 381.0, "r_x3": 396.2, "r_y3": 381.0, "coord_origin": "TOPLEFT" }, "text": "0.857", "orig": "0.857", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 37, "label": "text", "bbox": { "l": 440.8, "t": 381.0, "r": 457.1, "b": 389.1, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 48, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 440.8, "r_y0": 389.1, "r_x1": 457.1, "r_y1": 389.1, "r_x2": 457.1, "r_y2": 381.0, "r_x3": 440.8, "r_y3": 381.0, "coord_origin": "TOPLEFT" }, "text": "5.39", "orig": "5.39", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 38, "label": "text", "bbox": { "l": 161.9, "t": 399.8, "r": 166.5, "b": 407.9, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 49, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 161.9, "r_y0": 407.9, "r_x1": 166.5, "r_y1": 407.9, "r_x2": 166.5, "r_y2": 399.8, "r_x3": 161.9, "r_y3": 399.8, "coord_origin": "TOPLEFT" }, "text": "4", "orig": "4", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 39, "label": "text", "bbox": { "l": 209.5, "t": 399.8, "r": 214.1, "b": 407.9, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 50, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 209.5, "r_y0": 407.9, "r_x1": 214.1, "r_y1": 407.9, "r_x2": 214.1, "r_y2": 399.8, "r_x3": 209.5, "r_y3": 399.8, "coord_origin": "TOPLEFT" }, "text": "4", "orig": "4", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 40, "label": "text", "bbox": { "l": 246.7, "t": 394.3, "r": 271.4, "b": 402.4, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 51, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 246.7, "r_y0": 402.4, "r_x1": 271.4, "r_y1": 402.4, "r_x2": 271.4, "r_y2": 394.3, "r_x3": 246.7, "r_y3": 394.3, "coord_origin": "TOPLEFT" }, "text": "OTSL", "orig": "OTSL", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 41, "label": "text", "bbox": { "l": 289.0, "t": 394.3, "r": 310.0, "b": 402.4, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 52, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 289.0, "r_y0": 402.4, "r_x1": 310.0, "r_y1": 402.4, "r_x2": 310.0, "r_y2": 394.3, "r_x3": 289.0, "r_y3": 394.3, "coord_origin": "TOPLEFT" }, "text": "0.938", "orig": "0.938", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 42, "label": "text", "bbox": { "l": 326.7, "t": 394.3, "r": 347.7, "b": 402.4, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 53, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 326.7, "r_y0": 402.4, "r_x1": 347.7, "r_y1": 402.4, "r_x2": 347.7, "r_y2": 394.3, "r_x3": 326.7, "r_y3": 394.3, "coord_origin": "TOPLEFT" }, "text": "0.904", "orig": "0.904", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 43, "label": "text", "bbox": { "l": 363.7, "t": 394.3, "r": 384.7, "b": 402.4, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 54, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 363.7, "r_y0": 402.4, "r_x1": 384.7, "r_y1": 402.4, "r_x2": 384.7, "r_y2": 394.3, "r_x3": 363.7, "r_y3": 394.3, "coord_origin": "TOPLEFT" }, "text": "0.927", "orig": "0.927", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 44, "label": "text", "bbox": { "l": 394.6, "t": 394.3, "r": 418.8, "b": 402.2, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 55, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 394.6, "r_y0": 402.2, "r_x1": 418.8, "r_y1": 402.2, "r_x2": 418.8, "r_y2": 394.3, "r_x3": 394.6, "r_y3": 394.3, "coord_origin": "TOPLEFT" }, "text": "0.853", "orig": "0.853", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 45, "label": "text", "bbox": { "l": 439.5, "t": 394.3, "r": 458.4, "b": 402.2, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 56, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 439.5, "r_y0": 402.2, "r_x1": 458.4, "r_y1": 402.2, "r_x2": 458.4, "r_y2": 394.3, "r_x3": 439.5, "r_y3": 394.3, "coord_origin": "TOPLEFT" }, "text": "1.97", "orig": "1.97", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 46, "label": "text", "bbox": { "l": 245.2, "t": 407.3, "r": 272.9, "b": 415.4, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 57, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 245.2, "r_y0": 415.4, "r_x1": 272.9, "r_y1": 415.4, "r_x2": 272.9, "r_y2": 407.3, "r_x3": 245.2, "r_y3": 407.3, "coord_origin": "TOPLEFT" }, "text": "HTML", "orig": "HTML", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 47, "label": "text", "bbox": { "l": 289.0, "t": 407.3, "r": 310.0, "b": 415.4, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 58, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 289.0, "r_y0": 415.4, "r_x1": 310.0, "r_y1": 415.4, "r_x2": 310.0, "r_y2": 407.3, "r_x3": 289.0, "r_y3": 407.3, "coord_origin": "TOPLEFT" }, "text": "0.952", "orig": "0.952", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 48, "label": "text", "bbox": { "l": 326.7, "t": 407.3, "r": 347.7, "b": 415.4, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 59, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 326.7, "r_y0": 415.4, "r_x1": 347.7, "r_y1": 415.4, "r_x2": 347.7, "r_y2": 407.3, "r_x3": 326.7, "r_y3": 407.3, "coord_origin": "TOPLEFT" }, "text": "0.909", "orig": "0.909", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 49, "label": "text", "bbox": { "l": 362.1, "t": 407.2, "r": 386.2, "b": 415.2, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 60, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 362.1, "r_y0": 415.2, "r_x1": 386.2, "r_y1": 415.2, "r_x2": 386.2, "r_y2": 407.2, "r_x3": 362.1, "r_y3": 407.2, "coord_origin": "TOPLEFT" }, "text": "0.938", "orig": "0.938", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 50, "label": "text", "bbox": { "l": 396.2, "t": 407.3, "r": 417.2, "b": 415.4, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 61, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 396.2, "r_y0": 415.4, "r_x1": 417.2, "r_y1": 415.4, "r_x2": 417.2, "r_y2": 407.3, "r_x3": 396.2, "r_y3": 407.3, "coord_origin": "TOPLEFT" }, "text": "0.843", "orig": "0.843", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 51, "label": "text", "bbox": { "l": 440.8, "t": 407.3, "r": 457.1, "b": 415.4, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 62, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 440.8, "r_y0": 415.4, "r_x1": 457.1, "r_y1": 415.4, "r_x2": 457.1, "r_y2": 407.3, "r_x3": 440.8, "r_y3": 407.3, "coord_origin": "TOPLEFT" }, "text": "3.77", "orig": "3.77", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 52, "label": "text", "bbox": { "l": 161.9, "t": 426.1, "r": 166.5, "b": 434.2, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 63, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 161.9, "r_y0": 434.2, "r_x1": 166.5, "r_y1": 434.2, "r_x2": 166.5, "r_y2": 426.1, "r_x3": 161.9, "r_y3": 426.1, "coord_origin": "TOPLEFT" }, "text": "2", "orig": "2", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 53, "label": "text", "bbox": { "l": 209.5, "t": 426.1, "r": 214.1, "b": 434.2, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 64, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 209.5, "r_y0": 434.2, "r_x1": 214.1, "r_y1": 434.2, "r_x2": 214.1, "r_y2": 426.1, "r_x3": 209.5, "r_y3": 426.1, "coord_origin": "TOPLEFT" }, "text": "4", "orig": "4", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 54, "label": "text", "bbox": { "l": 246.7, "t": 420.6, "r": 271.4, "b": 428.7, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 65, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 246.7, "r_y0": 428.7, "r_x1": 271.4, "r_y1": 428.7, "r_x2": 271.4, "r_y2": 420.6, "r_x3": 246.7, "r_y3": 420.6, "coord_origin": "TOPLEFT" }, "text": "OTSL", "orig": "OTSL", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 55, "label": "text", "bbox": { "l": 289.0, "t": 420.6, "r": 310.0, "b": 428.7, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 66, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 289.0, "r_y0": 428.7, "r_x1": 310.0, "r_y1": 428.7, "r_x2": 310.0, "r_y2": 420.6, "r_x3": 289.0, "r_y3": 420.6, "coord_origin": "TOPLEFT" }, "text": "0.923", "orig": "0.923", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 56, "label": "text", "bbox": { "l": 326.7, "t": 420.6, "r": 347.7, "b": 428.7, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 67, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 326.7, "r_y0": 428.7, "r_x1": 347.7, "r_y1": 428.7, "r_x2": 347.7, "r_y2": 420.6, "r_x3": 326.7, "r_y3": 420.6, "coord_origin": "TOPLEFT" }, "text": "0.897", "orig": "0.897", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 57, "label": "text", "bbox": { "l": 363.7, "t": 420.6, "r": 384.7, "b": 428.7, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 68, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 363.7, "r_y0": 428.7, "r_x1": 384.7, "r_y1": 428.7, "r_x2": 384.7, "r_y2": 420.6, "r_x3": 363.7, "r_y3": 420.6, "coord_origin": "TOPLEFT" }, "text": "0.915", "orig": "0.915", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 58, "label": "text", "bbox": { "l": 394.6, "t": 420.6, "r": 418.8, "b": 428.5, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 69, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 394.6, "r_y0": 428.5, "r_x1": 418.8, "r_y1": 428.5, "r_x2": 418.8, "r_y2": 420.6, "r_x3": 394.6, "r_y3": 420.6, "coord_origin": "TOPLEFT" }, "text": "0.859", "orig": "0.859", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 59, "label": "text", "bbox": { "l": 439.5, "t": 420.6, "r": 458.4, "b": 428.5, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 70, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 439.5, "r_y0": 428.5, "r_x1": 458.4, "r_y1": 428.5, "r_x2": 458.4, "r_y2": 420.6, "r_x3": 439.5, "r_y3": 420.6, "coord_origin": "TOPLEFT" }, "text": "1.91", "orig": "1.91", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 60, "label": "text", "bbox": { "l": 245.2, "t": 433.6, "r": 272.9, "b": 441.7, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 71, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 245.2, "r_y0": 441.7, "r_x1": 272.9, "r_y1": 441.7, "r_x2": 272.9, "r_y2": 433.6, "r_x3": 245.2, "r_y3": 433.6, "coord_origin": "TOPLEFT" }, "text": "HTML", "orig": "HTML", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 61, "label": "text", "bbox": { "l": 289.0, "t": 433.6, "r": 310.0, "b": 441.7, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 72, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 289.0, "r_y0": 441.7, "r_x1": 310.0, "r_y1": 441.7, "r_x2": 310.0, "r_y2": 433.6, "r_x3": 289.0, "r_y3": 433.6, "coord_origin": "TOPLEFT" }, "text": "0.945", "orig": "0.945", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 62, "label": "text", "bbox": { "l": 326.7, "t": 433.6, "r": 347.7, "b": 441.7, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 73, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 326.7, "r_y0": 441.7, "r_x1": 347.7, "r_y1": 441.7, "r_x2": 347.7, "r_y2": 433.6, "r_x3": 326.7, "r_y3": 433.6, "coord_origin": "TOPLEFT" }, "text": "0.901", "orig": "0.901", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 63, "label": "text", "bbox": { "l": 362.1, "t": 433.5, "r": 386.2, "b": 441.5, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 74, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 362.1, "r_y0": 441.5, "r_x1": 386.2, "r_y1": 441.5, "r_x2": 386.2, "r_y2": 433.5, "r_x3": 362.1, "r_y3": 433.5, "coord_origin": "TOPLEFT" }, "text": "0.931", "orig": "0.931", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 64, "label": "text", "bbox": { "l": 396.2, "t": 433.6, "r": 417.2, "b": 441.7, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 75, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 396.2, "r_y0": 441.7, "r_x1": 417.2, "r_y1": 441.7, "r_x2": 417.2, "r_y2": 433.6, "r_x3": 396.2, "r_y3": 433.6, "coord_origin": "TOPLEFT" }, "text": "0.834", "orig": "0.834", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 65, "label": "text", "bbox": { "l": 440.8, "t": 433.6, "r": 457.1, "b": 441.7, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 76, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 440.8, "r_y0": 441.7, "r_x1": 457.1, "r_y1": 441.7, "r_x2": 457.1, "r_y2": 433.6, "r_x3": 440.8, "r_y3": 433.6, "coord_origin": "TOPLEFT" }, "text": "3.81", "orig": "3.81", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 66, "label": "text", "bbox": { "l": 161.9, "t": 452.4, "r": 166.5, "b": 460.5, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 77, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 161.9, "r_y0": 460.5, "r_x1": 166.5, "r_y1": 460.5, "r_x2": 166.5, "r_y2": 452.4, "r_x3": 161.9, "r_y3": 452.4, "coord_origin": "TOPLEFT" }, "text": "4", "orig": "4", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 67, "label": "text", "bbox": { "l": 209.5, "t": 452.4, "r": 214.1, "b": 460.5, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 78, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 209.5, "r_y0": 460.5, "r_x1": 214.1, "r_y1": 460.5, "r_x2": 214.1, "r_y2": 452.4, "r_x3": 209.5, "r_y3": 452.4, "coord_origin": "TOPLEFT" }, "text": "2", "orig": "2", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 68, "label": "text", "bbox": { "l": 246.7, "t": 446.9, "r": 271.4, "b": 455.0, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 79, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 246.7, "r_y0": 455.0, "r_x1": 271.4, "r_y1": 455.0, "r_x2": 271.4, "r_y2": 446.9, "r_x3": 246.7, "r_y3": 446.9, "coord_origin": "TOPLEFT" }, "text": "OTSL", "orig": "OTSL", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 69, "label": "text", "bbox": { "l": 289.0, "t": 446.9, "r": 310.0, "b": 455.0, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 80, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 289.0, "r_y0": 455.0, "r_x1": 310.0, "r_y1": 455.0, "r_x2": 310.0, "r_y2": 446.9, "r_x3": 289.0, "r_y3": 446.9, "coord_origin": "TOPLEFT" }, "text": "0.952", "orig": "0.952", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 70, "label": "text", "bbox": { "l": 329.0, "t": 446.9, "r": 345.4, "b": 455.0, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 81, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 329.0, "r_y0": 455.0, "r_x1": 345.4, "r_y1": 455.0, "r_x2": 345.4, "r_y2": 446.9, "r_x3": 329.0, "r_y3": 446.9, "coord_origin": "TOPLEFT" }, "text": "0.92", "orig": "0.92", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 71, "label": "text", "bbox": { "l": 362.1, "t": 446.9, "r": 386.2, "b": 454.8, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 82, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 362.1, "r_y0": 454.8, "r_x1": 386.2, "r_y1": 454.8, "r_x2": 386.2, "r_y2": 446.9, "r_x3": 362.1, "r_y3": 446.9, "coord_origin": "TOPLEFT" }, "text": "0.942", "orig": "0.942", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 72, "label": "text", "bbox": { "l": 394.6, "t": 446.9, "r": 418.8, "b": 454.8, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 83, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 394.6, "r_y0": 454.8, "r_x1": 418.8, "r_y1": 454.8, "r_x2": 418.8, "r_y2": 446.9, "r_x3": 394.6, "r_y3": 446.9, "coord_origin": "TOPLEFT" }, "text": "0.857", "orig": "0.857", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 73, "label": "text", "bbox": { "l": 439.5, "t": 446.9, "r": 458.4, "b": 454.8, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 84, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 439.5, "r_y0": 454.8, "r_x1": 458.4, "r_y1": 454.8, "r_x2": 458.4, "r_y2": 446.9, "r_x3": 439.5, "r_y3": 446.9, "coord_origin": "TOPLEFT" }, "text": "1.22", "orig": "1.22", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 74, "label": "text", "bbox": { "l": 245.2, "t": 459.9, "r": 272.9, "b": 468.0, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 85, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 245.2, "r_y0": 468.0, "r_x1": 272.9, "r_y1": 468.0, "r_x2": 272.9, "r_y2": 459.9, "r_x3": 245.2, "r_y3": 459.9, "coord_origin": "TOPLEFT" }, "text": "HTML", "orig": "HTML", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 75, "label": "text", "bbox": { "l": 289.0, "t": 459.9, "r": 310.0, "b": 468.0, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 86, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 289.0, "r_y0": 468.0, "r_x1": 310.0, "r_y1": 468.0, "r_x2": 310.0, "r_y2": 459.9, "r_x3": 289.0, "r_y3": 459.9, "coord_origin": "TOPLEFT" }, "text": "0.944", "orig": "0.944", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 76, "label": "text", "bbox": { "l": 326.7, "t": 459.9, "r": 347.7, "b": 468.0, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 87, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 326.7, "r_y0": 468.0, "r_x1": 347.7, "r_y1": 468.0, "r_x2": 347.7, "r_y2": 459.9, "r_x3": 326.7, "r_y3": 459.9, "coord_origin": "TOPLEFT" }, "text": "0.903", "orig": "0.903", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 77, "label": "text", "bbox": { "l": 363.7, "t": 459.9, "r": 384.7, "b": 468.0, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 88, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 363.7, "r_y0": 468.0, "r_x1": 384.7, "r_y1": 468.0, "r_x2": 384.7, "r_y2": 459.9, "r_x3": 363.7, "r_y3": 459.9, "coord_origin": "TOPLEFT" }, "text": "0.931", "orig": "0.931", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 78, "label": "text", "bbox": { "l": 396.2, "t": 459.9, "r": 417.2, "b": 468.0, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 89, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 396.2, "r_y0": 468.0, "r_x1": 417.2, "r_y1": 468.0, "r_x2": 417.2, "r_y2": 459.9, "r_x3": 396.2, "r_y3": 459.9, "coord_origin": "TOPLEFT" }, "text": "0.824", "orig": "0.824", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 79, "label": "text", "bbox": { "l": 446.7, "t": 459.9, "r": 451.3, "b": 468.0, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 90, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 446.7, "r_y0": 468.0, "r_x1": 451.3, "r_y1": 468.0, "r_x2": 451.3, "r_y2": 459.9, "r_x3": 446.7, "r_y3": 459.9, "coord_origin": "TOPLEFT" }, "text": "2", "orig": "2", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] } ] }, "text": null, "otsl_seq": [ "ched", "ched", "ched", "ched", "lcel", "lcel", "ched", "ched", "nl", "ucel", "ucel", "ucel", "ched", "ched", "ched", "ched", "ched", "nl", "fcel", "fcel", "fcel", "fcel", "fcel", "fcel", "fcel", "fcel", "nl", "fcel", "fcel", "fcel", "fcel", "fcel", "fcel", "fcel", "fcel", "nl", "fcel", "fcel", "fcel", "fcel", "fcel", "fcel", "fcel", "fcel", "nl", "fcel", "fcel", "fcel", "fcel", "fcel", "fcel", "fcel", "fcel", "nl" ], "num_rows": 6, "num_cols": 8, "table_cells": [ { "bbox": { "l": 160.4, "t": 341.7, "r": 168.0, "b": 349.8, "coord_origin": "TOPLEFT" }, "row_span": 2, "col_span": 1, "start_row_offset_idx": 0, "end_row_offset_idx": 2, "start_col_offset_idx": 0, "end_col_offset_idx": 1, "text": "# enc-layers", "column_header": true, "row_header": false, "row_section": false }, { "bbox": { "l": 208.0, "t": 341.7, "r": 215.7, "b": 349.8, "coord_origin": "TOPLEFT" }, "row_span": 2, "col_span": 1, "start_row_offset_idx": 0, "end_row_offset_idx": 2, "start_col_offset_idx": 1, "end_col_offset_idx": 2, "text": "# dec-layers", "column_header": true, "row_header": false, "row_section": false }, { "bbox": { "l": 239.8, "t": 347.2, "r": 278.3, "b": 355.3, "coord_origin": "TOPLEFT" }, "row_span": 2, "col_span": 1, "start_row_offset_idx": 0, "end_row_offset_idx": 2, "start_col_offset_idx": 2, "end_col_offset_idx": 3, "text": "Language", "column_header": true, "row_header": false, "row_section": false }, { "bbox": { "l": 324.7, "t": 341.7, "r": 348.3, "b": 349.8, "coord_origin": "TOPLEFT" }, "row_span": 1, "col_span": 3, "start_row_offset_idx": 0, "end_row_offset_idx": 1, "start_col_offset_idx": 3, "end_col_offset_idx": 6, "text": "TEDs", "column_header": true, "row_header": false, "row_section": false }, { "bbox": { "l": 396.3, "t": 341.7, "r": 417.1, "b": 349.8, "coord_origin": "TOPLEFT" }, "row_span": 1, "col_span": 1, "start_row_offset_idx": 0, "end_row_offset_idx": 1, "start_col_offset_idx": 6, "end_col_offset_idx": 7, "text": "mAP", "column_header": true, "row_header": false, "row_section": false }, { "bbox": { "l": 394.9, "t": 352.7, "r": 418.5, "b": 360.8, "coord_origin": "TOPLEFT" }, "row_span": 1, "col_span": 1, "start_row_offset_idx": 1, "end_row_offset_idx": 2, "start_col_offset_idx": 6, "end_col_offset_idx": 7, "text": "(0.75)", "column_header": true, "row_header": false, "row_section": false }, { "bbox": { "l": 430.8, "t": 341.7, "r": 467.1, "b": 349.8, "coord_origin": "TOPLEFT" }, "row_span": 1, "col_span": 1, "start_row_offset_idx": 0, "end_row_offset_idx": 1, "start_col_offset_idx": 7, "end_col_offset_idx": 8, "text": "Inference", "column_header": true, "row_header": false, "row_section": false }, { "bbox": { "l": 427.1, "t": 352.7, "r": 470.8, "b": 360.8, "coord_origin": "TOPLEFT" }, "row_span": 1, "col_span": 1, "start_row_offset_idx": 1, "end_row_offset_idx": 2, "start_col_offset_idx": 7, "end_col_offset_idx": 8, "text": "time (secs)", "column_header": true, "row_header": false, "row_section": false }, { "bbox": { "l": 286.7, "t": 354.7, "r": 312.3, "b": 362.8, "coord_origin": "TOPLEFT" }, "row_span": 1, "col_span": 1, "start_row_offset_idx": 1, "end_row_offset_idx": 2, "start_col_offset_idx": 3, "end_col_offset_idx": 4, "text": "simple", "column_header": true, "row_header": false, "row_section": false }, { "bbox": { "l": 320.7, "t": 354.7, "r": 353.7, "b": 362.8, "coord_origin": "TOPLEFT" }, "row_span": 1, "col_span": 1, "start_row_offset_idx": 1, "end_row_offset_idx": 2, "start_col_offset_idx": 4, "end_col_offset_idx": 5, "text": "complex", "column_header": true, "row_header": false, "row_section": false }, { "bbox": { "l": 369.3, "t": 354.7, "r": 379.0, "b": 362.8, "coord_origin": "TOPLEFT" }, "row_span": 1, "col_span": 1, "start_row_offset_idx": 1, "end_row_offset_idx": 2, "start_col_offset_idx": 5, "end_col_offset_idx": 6, "text": "all", "column_header": true, "row_header": false, "row_section": false }, { "bbox": { "l": 161.9, "t": 373.5, "r": 166.5, "b": 381.6, "coord_origin": "TOPLEFT" }, "row_span": 1, "col_span": 1, "start_row_offset_idx": 2, "end_row_offset_idx": 3, "start_col_offset_idx": 0, "end_col_offset_idx": 1, "text": "6", "column_header": false, "row_header": false, "row_section": false }, { "bbox": { "l": 209.5, "t": 373.5, "r": 214.1, "b": 381.6, "coord_origin": "TOPLEFT" }, "row_span": 1, "col_span": 1, "start_row_offset_idx": 2, "end_row_offset_idx": 3, "start_col_offset_idx": 1, "end_col_offset_idx": 2, "text": "6", "column_header": false, "row_header": false, "row_section": false }, { "bbox": { "l": 246.7, "t": 368.0, "r": 271.4, "b": 376.1, "coord_origin": "TOPLEFT" }, "row_span": 1, "col_span": 1, "start_row_offset_idx": 2, "end_row_offset_idx": 3, "start_col_offset_idx": 2, "end_col_offset_idx": 3, "text": "OTSL HTML", "column_header": false, "row_header": false, "row_section": false }, { "bbox": { "l": 289.0, "t": 368.0, "r": 310.0, "b": 376.1, "coord_origin": "TOPLEFT" }, "row_span": 1, "col_span": 1, "start_row_offset_idx": 2, "end_row_offset_idx": 3, "start_col_offset_idx": 3, "end_col_offset_idx": 4, "text": "0.965 0.969", "column_header": false, "row_header": false, "row_section": false }, { "bbox": { "l": 326.7, "t": 368.0, "r": 347.7, "b": 376.1, "coord_origin": "TOPLEFT" }, "row_span": 1, "col_span": 1, "start_row_offset_idx": 2, "end_row_offset_idx": 3, "start_col_offset_idx": 4, "end_col_offset_idx": 5, "text": "0.934 0.927", "column_header": false, "row_header": false, "row_section": false }, { "bbox": { "l": 363.7, "t": 368.0, "r": 384.7, "b": 376.1, "coord_origin": "TOPLEFT" }, "row_span": 1, "col_span": 1, "start_row_offset_idx": 2, "end_row_offset_idx": 3, "start_col_offset_idx": 5, "end_col_offset_idx": 6, "text": "0.955 0.955", "column_header": false, "row_header": false, "row_section": false }, { "bbox": { "l": 397.3, "t": 368.0, "r": 416.1, "b": 375.9, "coord_origin": "TOPLEFT" }, "row_span": 1, "col_span": 1, "start_row_offset_idx": 2, "end_row_offset_idx": 3, "start_col_offset_idx": 6, "end_col_offset_idx": 7, "text": "0.88 0.857", "column_header": false, "row_header": false, "row_section": false }, { "bbox": { "l": 439.5, "t": 368.0, "r": 458.4, "b": 375.9, "coord_origin": "TOPLEFT" }, "row_span": 1, "col_span": 1, "start_row_offset_idx": 2, "end_row_offset_idx": 3, "start_col_offset_idx": 7, "end_col_offset_idx": 8, "text": "2.73 5.39", "column_header": false, "row_header": false, "row_section": false }, { "bbox": { "l": 161.9, "t": 399.8, "r": 166.5, "b": 407.9, "coord_origin": "TOPLEFT" }, "row_span": 1, "col_span": 1, "start_row_offset_idx": 3, "end_row_offset_idx": 4, "start_col_offset_idx": 0, "end_col_offset_idx": 1, "text": "4", "column_header": false, "row_header": false, "row_section": false }, { "bbox": { "l": 209.5, "t": 399.8, "r": 214.1, "b": 407.9, "coord_origin": "TOPLEFT" }, "row_span": 1, "col_span": 1, "start_row_offset_idx": 3, "end_row_offset_idx": 4, "start_col_offset_idx": 1, "end_col_offset_idx": 2, "text": "4", "column_header": false, "row_header": false, "row_section": false }, { "bbox": { "l": 246.7, "t": 394.3, "r": 271.4, "b": 402.4, "coord_origin": "TOPLEFT" }, "row_span": 1, "col_span": 1, "start_row_offset_idx": 3, "end_row_offset_idx": 4, "start_col_offset_idx": 2, "end_col_offset_idx": 3, "text": "OTSL HTML", "column_header": false, "row_header": false, "row_section": false }, { "bbox": { "l": 289.0, "t": 394.3, "r": 310.0, "b": 402.4, "coord_origin": "TOPLEFT" }, "row_span": 1, "col_span": 1, "start_row_offset_idx": 3, "end_row_offset_idx": 4, "start_col_offset_idx": 3, "end_col_offset_idx": 4, "text": "0.938 0.952", "column_header": false, "row_header": false, "row_section": false }, { "bbox": { "l": 326.7, "t": 394.3, "r": 347.7, "b": 402.4, "coord_origin": "TOPLEFT" }, "row_span": 1, "col_span": 1, "start_row_offset_idx": 3, "end_row_offset_idx": 4, "start_col_offset_idx": 4, "end_col_offset_idx": 5, "text": "0.904 0.909", "column_header": false, "row_header": false, "row_section": false }, { "bbox": { "l": 363.7, "t": 394.3, "r": 384.7, "b": 402.4, "coord_origin": "TOPLEFT" }, "row_span": 1, "col_span": 1, "start_row_offset_idx": 3, "end_row_offset_idx": 4, "start_col_offset_idx": 5, "end_col_offset_idx": 6, "text": "0.927 0.938", "column_header": false, "row_header": false, "row_section": false }, { "bbox": { "l": 394.6, "t": 394.3, "r": 418.8, "b": 402.2, "coord_origin": "TOPLEFT" }, "row_span": 1, "col_span": 1, "start_row_offset_idx": 3, "end_row_offset_idx": 4, "start_col_offset_idx": 6, "end_col_offset_idx": 7, "text": "0.853 0.843", "column_header": false, "row_header": false, "row_section": false }, { "bbox": { "l": 439.5, "t": 394.3, "r": 458.4, "b": 402.2, "coord_origin": "TOPLEFT" }, "row_span": 1, "col_span": 1, "start_row_offset_idx": 3, "end_row_offset_idx": 4, "start_col_offset_idx": 7, "end_col_offset_idx": 8, "text": "1.97 3.77", "column_header": false, "row_header": false, "row_section": false }, { "bbox": { "l": 161.9, "t": 426.1, "r": 166.5, "b": 434.2, "coord_origin": "TOPLEFT" }, "row_span": 1, "col_span": 1, "start_row_offset_idx": 4, "end_row_offset_idx": 5, "start_col_offset_idx": 0, "end_col_offset_idx": 1, "text": "2", "column_header": false, "row_header": false, "row_section": false }, { "bbox": { "l": 209.5, "t": 426.1, "r": 214.1, "b": 434.2, "coord_origin": "TOPLEFT" }, "row_span": 1, "col_span": 1, "start_row_offset_idx": 4, "end_row_offset_idx": 5, "start_col_offset_idx": 1, "end_col_offset_idx": 2, "text": "4", "column_header": false, "row_header": false, "row_section": false }, { "bbox": { "l": 246.7, "t": 420.6, "r": 271.4, "b": 428.7, "coord_origin": "TOPLEFT" }, "row_span": 1, "col_span": 1, "start_row_offset_idx": 4, "end_row_offset_idx": 5, "start_col_offset_idx": 2, "end_col_offset_idx": 3, "text": "OTSL HTML", "column_header": false, "row_header": false, "row_section": false }, { "bbox": { "l": 289.0, "t": 420.6, "r": 310.0, "b": 428.7, "coord_origin": "TOPLEFT" }, "row_span": 1, "col_span": 1, "start_row_offset_idx": 4, "end_row_offset_idx": 5, "start_col_offset_idx": 3, "end_col_offset_idx": 4, "text": "0.923 0.945", "column_header": false, "row_header": false, "row_section": false }, { "bbox": { "l": 326.7, "t": 420.6, "r": 347.7, "b": 428.7, "coord_origin": "TOPLEFT" }, "row_span": 1, "col_span": 1, "start_row_offset_idx": 4, "end_row_offset_idx": 5, "start_col_offset_idx": 4, "end_col_offset_idx": 5, "text": "0.897 0.901", "column_header": false, "row_header": false, "row_section": false }, { "bbox": { "l": 363.7, "t": 420.6, "r": 384.7, "b": 428.7, "coord_origin": "TOPLEFT" }, "row_span": 1, "col_span": 1, "start_row_offset_idx": 4, "end_row_offset_idx": 5, "start_col_offset_idx": 5, "end_col_offset_idx": 6, "text": "0.915 0.931", "column_header": false, "row_header": false, "row_section": false }, { "bbox": { "l": 394.6, "t": 420.6, "r": 418.8, "b": 428.5, "coord_origin": "TOPLEFT" }, "row_span": 1, "col_span": 1, "start_row_offset_idx": 4, "end_row_offset_idx": 5, "start_col_offset_idx": 6, "end_col_offset_idx": 7, "text": "0.859 0.834", "column_header": false, "row_header": false, "row_section": false }, { "bbox": { "l": 439.5, "t": 420.6, "r": 458.4, "b": 428.5, "coord_origin": "TOPLEFT" }, "row_span": 1, "col_span": 1, "start_row_offset_idx": 4, "end_row_offset_idx": 5, "start_col_offset_idx": 7, "end_col_offset_idx": 8, "text": "1.91 3.81", "column_header": false, "row_header": false, "row_section": false }, { "bbox": { "l": 161.9, "t": 452.4, "r": 166.5, "b": 460.5, "coord_origin": "TOPLEFT" }, "row_span": 1, "col_span": 1, "start_row_offset_idx": 5, "end_row_offset_idx": 6, "start_col_offset_idx": 0, "end_col_offset_idx": 1, "text": "4", "column_header": false, "row_header": false, "row_section": false }, { "bbox": { "l": 209.5, "t": 452.4, "r": 214.1, "b": 460.5, "coord_origin": "TOPLEFT" }, "row_span": 1, "col_span": 1, "start_row_offset_idx": 5, "end_row_offset_idx": 6, "start_col_offset_idx": 1, "end_col_offset_idx": 2, "text": "2", "column_header": false, "row_header": false, "row_section": false }, { "bbox": { "l": 246.7, "t": 446.9, "r": 271.4, "b": 455.0, "coord_origin": "TOPLEFT" }, "row_span": 1, "col_span": 1, "start_row_offset_idx": 5, "end_row_offset_idx": 6, "start_col_offset_idx": 2, "end_col_offset_idx": 3, "text": "OTSL HTML", "column_header": false, "row_header": false, "row_section": false }, { "bbox": { "l": 289.0, "t": 446.9, "r": 310.0, "b": 455.0, "coord_origin": "TOPLEFT" }, "row_span": 1, "col_span": 1, "start_row_offset_idx": 5, "end_row_offset_idx": 6, "start_col_offset_idx": 3, "end_col_offset_idx": 4, "text": "0.952 0.944", "column_header": false, "row_header": false, "row_section": false }, { "bbox": { "l": 329.0, "t": 446.9, "r": 345.4, "b": 455.0, "coord_origin": "TOPLEFT" }, "row_span": 1, "col_span": 1, "start_row_offset_idx": 5, "end_row_offset_idx": 6, "start_col_offset_idx": 4, "end_col_offset_idx": 5, "text": "0.92 0.903", "column_header": false, "row_header": false, "row_section": false }, { "bbox": { "l": 362.1, "t": 446.9, "r": 386.2, "b": 454.8, "coord_origin": "TOPLEFT" }, "row_span": 1, "col_span": 1, "start_row_offset_idx": 5, "end_row_offset_idx": 6, "start_col_offset_idx": 5, "end_col_offset_idx": 6, "text": "0.942 0.931", "column_header": false, "row_header": false, "row_section": false }, { "bbox": { "l": 394.6, "t": 446.9, "r": 418.8, "b": 454.8, "coord_origin": "TOPLEFT" }, "row_span": 1, "col_span": 1, "start_row_offset_idx": 5, "end_row_offset_idx": 6, "start_col_offset_idx": 6, "end_col_offset_idx": 7, "text": "0.857 0.824", "column_header": false, "row_header": false, "row_section": false }, { "bbox": { "l": 439.5, "t": 446.9, "r": 458.4, "b": 454.8, "coord_origin": "TOPLEFT" }, "row_span": 1, "col_span": 1, "start_row_offset_idx": 5, "end_row_offset_idx": 6, "start_col_offset_idx": 7, "end_col_offset_idx": 8, "text": "1.22 2", "column_header": false, "row_header": false, "row_section": false } ] } } }, "figures_classification": null, "equations_prediction": null, "vlm_response": null }, "assembled": { "elements": [ { "label": "page_header", "id": 8, "page_no": 8, "cluster": { "id": 8, "label": "page_header", "bbox": { "l": 194.5, "t": 93.8, "r": 447.5, "b": 101.8, "coord_origin": "TOPLEFT" }, "confidence": 0.94, "cells": [ { "index": 0, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 194.5, "r_y0": 101.8, "r_x1": 447.5, "r_y1": 101.8, "r_x2": 447.5, "r_y2": 93.8, "r_x3": 194.5, "r_y3": 93.8, "coord_origin": "TOPLEFT" }, "text": "Optimized Table Tokenization for Table Structure Recognition", "orig": "Optimized Table Tokenization for Table Structure Recognition", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, "text": "Optimized Table Tokenization for Table Structure Recognition" }, { "label": "page_header", "id": 9, "page_no": 8, "cluster": { "id": 9, "label": "page_header", "bbox": { "l": 476.0, "t": 93.8, "r": 480.6, "b": 101.8, "coord_origin": "TOPLEFT" }, "confidence": 0.89, "cells": [ { "index": 1, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 476.0, "r_y0": 101.8, "r_x1": 480.6, "r_y1": 101.8, "r_x2": 480.6, "r_y2": 93.8, "r_x3": 476.0, "r_y3": 93.8, "coord_origin": "TOPLEFT" }, "text": "9", "orig": "9", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, "text": "9" }, { "label": "text", "id": 4, "page_no": 8, "cluster": { "id": 4, "label": "text", "bbox": { "l": 134.8, "t": 118.9, "r": 480.6, "b": 151.6, "coord_origin": "TOPLEFT" }, "confidence": 0.98, "cells": [ { "index": 2, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 134.8, "r_y0": 127.7, "r_x1": 480.6, "r_y1": 127.7, "r_x2": 480.6, "r_y2": 118.9, "r_x3": 134.8, "r_y3": 118.9, "coord_origin": "TOPLEFT" }, "text": "order to compute the TED score. Inference timing results for all experiments", "orig": "order to compute the TED score. Inference timing results for all experiments", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 3, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 134.8, "r_y0": 139.7, "r_x1": 480.6, "r_y1": 139.7, "r_x2": 480.6, "r_y2": 130.9, "r_x3": 134.8, "r_y3": 130.9, "coord_origin": "TOPLEFT" }, "text": "were obtained from the same machine on a single core with AMD EPYC 7763", "orig": "were obtained from the same machine on a single core with AMD EPYC 7763", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 4, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 134.8, "r_y0": 151.6, "r_x1": 210.8, "r_y1": 151.6, "r_x2": 210.8, "r_y2": 142.8, "r_x3": 134.8, "r_y3": 142.8, "coord_origin": "TOPLEFT" }, "text": "CPU @2.45 GHz.", "orig": "CPU @2.45 GHz.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, "text": "order to compute the TED score. Inference timing results for all experiments were obtained from the same machine on a single core with AMD EPYC 7763 CPU @2.45 GHz." }, { "label": "section_header", "id": 6, "page_no": 8, "cluster": { "id": 6, "label": "section_header", "bbox": { "l": 134.8, "t": 169.2, "r": 318.4, "b": 178.0, "coord_origin": "TOPLEFT" }, "confidence": 0.96, "cells": [ { "index": 5, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 134.8, "r_y0": 178.0, "r_x1": 149.4, "r_y1": 178.0, "r_x2": 149.4, "r_y2": 169.2, "r_x3": 134.8, "r_y3": 169.2, "coord_origin": "TOPLEFT" }, "text": "5.1", "orig": "5.1", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 6, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 160.9, "r_y0": 178.0, "r_x1": 318.4, "r_y1": 178.0, "r_x2": 318.4, "r_y2": 169.2, "r_x3": 160.9, "r_y3": 169.2, "coord_origin": "TOPLEFT" }, "text": "Hyper Parameter Optimization", "orig": "Hyper Parameter Optimization", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, "text": "5.1 Hyper Parameter Optimization" }, { "label": "text", "id": 3, "page_no": 8, "cluster": { "id": 3, "label": "text", "bbox": { "l": 134.8, "t": 185.6, "r": 480.6, "b": 254.2, "coord_origin": "TOPLEFT" }, "confidence": 0.98, "cells": [ { "index": 7, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 134.8, "r_y0": 194.4, "r_x1": 480.6, "r_y1": 194.4, "r_x2": 480.6, "r_y2": 185.6, "r_x3": 134.8, "r_y3": 185.6, "coord_origin": "TOPLEFT" }, "text": "We have chosen the PubTabNet data set to perform HPO, since it includes a", "orig": "We have chosen the PubTabNet data set to perform HPO, since it includes a", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 8, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 134.8, "r_y0": 206.3, "r_x1": 480.6, "r_y1": 206.3, "r_x2": 480.6, "r_y2": 197.5, "r_x3": 134.8, "r_y3": 197.5, "coord_origin": "TOPLEFT" }, "text": "highly diverse set of tables. Also we report TED scores separately for simple and", "orig": "highly diverse set of tables. Also we report TED scores separately for simple and", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 9, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 134.8, "r_y0": 218.3, "r_x1": 480.6, "r_y1": 218.3, "r_x2": 480.6, "r_y2": 209.5, "r_x3": 134.8, "r_y3": 209.5, "coord_origin": "TOPLEFT" }, "text": "complex tables (tables with cell spans). Results are presented in Table. 1. It is", "orig": "complex tables (tables with cell spans). Results are presented in Table. 1. It is", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 10, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 134.8, "r_y0": 230.2, "r_x1": 480.6, "r_y1": 230.2, "r_x2": 480.6, "r_y2": 221.5, "r_x3": 134.8, "r_y3": 221.5, "coord_origin": "TOPLEFT" }, "text": "evident that with OTSL, our model achieves the same TED score and slightly", "orig": "evident that with OTSL, our model achieves the same TED score and slightly", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 11, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 134.8, "r_y0": 242.2, "r_x1": 440.9, "r_y1": 242.2, "r_x2": 440.9, "r_y2": 233.4, "r_x3": 134.8, "r_y3": 233.4, "coord_origin": "TOPLEFT" }, "text": "better mAP scores in comparison to HTML. However OTSL yields a", "orig": "better mAP scores in comparison to HTML. However OTSL yields a", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 12, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 444.9, "r_y0": 242.2, "r_x1": 480.6, "r_y1": 242.2, "r_x2": 480.6, "r_y2": 233.4, "r_x3": 444.9, "r_y3": 233.4, "coord_origin": "TOPLEFT" }, "text": "2x speed", "orig": "2x speed", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 13, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 134.8, "r_y0": 254.2, "r_x1": 145.2, "r_y1": 254.2, "r_x2": 145.2, "r_y2": 245.4, "r_x3": 134.8, "r_y3": 245.4, "coord_origin": "TOPLEFT" }, "text": "up", "orig": "up", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 14, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 149.1, "r_y0": 254.2, "r_x1": 311.2, "r_y1": 254.2, "r_x2": 311.2, "r_y2": 245.4, "r_x3": 149.1, "r_y3": 245.4, "coord_origin": "TOPLEFT" }, "text": "in the inference runtime over HTML.", "orig": "in the inference runtime over HTML.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, "text": "We have chosen the PubTabNet data set to perform HPO, since it includes a highly diverse set of tables. Also we report TED scores separately for simple and complex tables (tables with cell spans). Results are presented in Table. 1. It is evident that with OTSL, our model achieves the same TED score and slightly better mAP scores in comparison to HTML. However OTSL yields a 2x speed up in the inference runtime over HTML." }, { "label": "caption", "id": 7, "page_no": 8, "cluster": { "id": 7, "label": "caption", "bbox": { "l": 134.8, "t": 275.1, "r": 480.6, "b": 327.0, "coord_origin": "TOPLEFT" }, "confidence": 0.96, "cells": [ { "index": 15, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 134.8, "r_y0": 283.0, "r_x1": 160.1, "r_y1": 283.0, "r_x2": 160.1, "r_y2": 275.1, "r_x3": 134.8, "r_y3": 275.1, "coord_origin": "TOPLEFT" }, "text": "Table", "orig": "Table", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 16, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 167.3, "r_y0": 283.0, "r_x1": 175.6, "r_y1": 283.0, "r_x2": 175.6, "r_y2": 275.1, "r_x3": 167.3, "r_y3": 275.1, "coord_origin": "TOPLEFT" }, "text": "1.", "orig": "1.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 17, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 188.1, "r_y0": 283.2, "r_x1": 480.6, "r_y1": 283.2, "r_x2": 480.6, "r_y2": 275.1, "r_x3": 188.1, "r_y3": 275.1, "coord_origin": "TOPLEFT" }, "text": "HPO performed in OTSL and HTML representation on the same", "orig": "HPO performed in OTSL and HTML representation on the same", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 18, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 134.8, "r_y0": 294.2, "r_x1": 480.6, "r_y1": 294.2, "r_x2": 480.6, "r_y2": 286.1, "r_x3": 134.8, "r_y3": 286.1, "coord_origin": "TOPLEFT" }, "text": "transformer-based TableFormer [9] architecture, trained only on PubTabNet [22]. Ef-", "orig": "transformer-based TableFormer [9] architecture, trained only on PubTabNet [22]. Ef-", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 19, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 134.8, "r_y0": 305.1, "r_x1": 480.6, "r_y1": 305.1, "r_x2": 480.6, "r_y2": 297.1, "r_x3": 134.8, "r_y3": 297.1, "coord_origin": "TOPLEFT" }, "text": "fects of reducing the # of layers in encoder and decoder stages of the model show that", "orig": "fects of reducing the # of layers in encoder and decoder stages of the model show that", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 20, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 134.8, "r_y0": 316.1, "r_x1": 480.6, "r_y1": 316.1, "r_x2": 480.6, "r_y2": 308.0, "r_x3": 134.8, "r_y3": 308.0, "coord_origin": "TOPLEFT" }, "text": "smaller models trained on OTSL perform better, especially in recognizing complex", "orig": "smaller models trained on OTSL perform better, especially in recognizing complex", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 21, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 134.8, "r_y0": 327.0, "r_x1": 480.6, "r_y1": 327.0, "r_x2": 480.6, "r_y2": 319.0, "r_x3": 134.8, "r_y3": 319.0, "coord_origin": "TOPLEFT" }, "text": "table structures, and maintain a much higher mAP score than the HTML counterpart.", "orig": "table structures, and maintain a much higher mAP score than the HTML counterpart.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, "text": "Table 1. HPO performed in OTSL and HTML representation on the same transformer-based TableFormer [9] architecture, trained only on PubTabNet [22]. Effects of reducing the # of layers in encoder and decoder stages of the model show that smaller models trained on OTSL perform better, especially in recognizing complex table structures, and maintain a much higher mAP score than the HTML counterpart." }, { "label": "table", "id": 0, "page_no": 8, "cluster": { "id": 0, "label": "table", "bbox": { "l": 139.7, "t": 337.6, "r": 475.0, "b": 469.5, "coord_origin": "TOPLEFT" }, "confidence": 0.99, "cells": [ { "index": 22, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 160.4, "r_y0": 349.8, "r_x1": 168.0, "r_y1": 349.8, "r_x2": 168.0, "r_y2": 341.7, "r_x3": 160.4, "r_y3": 341.7, "coord_origin": "TOPLEFT" }, "text": "#", "orig": "#", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 23, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 144.6, "r_y0": 362.8, "r_x1": 183.8, "r_y1": 362.8, "r_x2": 183.8, "r_y2": 354.7, "r_x3": 144.6, "r_y3": 354.7, "coord_origin": "TOPLEFT" }, "text": "enc-layers", "orig": "enc-layers", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 24, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 208.0, "r_y0": 349.8, "r_x1": 215.7, "r_y1": 349.8, "r_x2": 215.7, "r_y2": 341.7, "r_x3": 208.0, "r_y3": 341.7, "coord_origin": "TOPLEFT" }, "text": "#", "orig": "#", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 25, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 192.2, "r_y0": 362.8, "r_x1": 231.4, "r_y1": 362.8, "r_x2": 231.4, "r_y2": 354.7, "r_x3": 192.2, "r_y3": 354.7, "coord_origin": "TOPLEFT" }, "text": "dec-layers", "orig": "dec-layers", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 26, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 239.8, "r_y0": 355.3, "r_x1": 278.3, "r_y1": 355.3, "r_x2": 278.3, "r_y2": 347.2, "r_x3": 239.8, "r_y3": 347.2, "coord_origin": "TOPLEFT" }, "text": "Language", "orig": "Language", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 27, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 324.7, "r_y0": 349.8, "r_x1": 348.3, "r_y1": 349.8, "r_x2": 348.3, "r_y2": 341.7, "r_x3": 324.7, "r_y3": 341.7, "coord_origin": "TOPLEFT" }, "text": "TEDs", "orig": "TEDs", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 28, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 396.3, "r_y0": 349.8, "r_x1": 417.1, "r_y1": 349.8, "r_x2": 417.1, "r_y2": 341.7, "r_x3": 396.3, "r_y3": 341.7, "coord_origin": "TOPLEFT" }, "text": "mAP", "orig": "mAP", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 29, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 394.9, "r_y0": 360.8, "r_x1": 418.5, "r_y1": 360.8, "r_x2": 418.5, "r_y2": 352.7, "r_x3": 394.9, "r_y3": 352.7, "coord_origin": "TOPLEFT" }, "text": "(0.75)", "orig": "(0.75)", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 30, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 430.8, "r_y0": 349.8, "r_x1": 467.1, "r_y1": 349.8, "r_x2": 467.1, "r_y2": 341.7, "r_x3": 430.8, "r_y3": 341.7, "coord_origin": "TOPLEFT" }, "text": "Inference", "orig": "Inference", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 31, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 427.1, "r_y0": 360.8, "r_x1": 470.8, "r_y1": 360.8, "r_x2": 470.8, "r_y2": 352.7, "r_x3": 427.1, "r_y3": 352.7, "coord_origin": "TOPLEFT" }, "text": "time (secs)", "orig": "time (secs)", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 32, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 286.7, "r_y0": 362.8, "r_x1": 312.3, "r_y1": 362.8, "r_x2": 312.3, "r_y2": 354.7, "r_x3": 286.7, "r_y3": 354.7, "coord_origin": "TOPLEFT" }, "text": "simple", "orig": "simple", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 33, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 320.7, "r_y0": 362.8, "r_x1": 353.7, "r_y1": 362.8, "r_x2": 353.7, "r_y2": 354.7, "r_x3": 320.7, "r_y3": 354.7, "coord_origin": "TOPLEFT" }, "text": "complex", "orig": "complex", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 34, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 369.3, "r_y0": 362.8, "r_x1": 379.0, "r_y1": 362.8, "r_x2": 379.0, "r_y2": 354.7, "r_x3": 369.3, "r_y3": 354.7, "coord_origin": "TOPLEFT" }, "text": "all", "orig": "all", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 35, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 161.9, "r_y0": 381.6, "r_x1": 166.5, "r_y1": 381.6, "r_x2": 166.5, "r_y2": 373.5, "r_x3": 161.9, "r_y3": 373.5, "coord_origin": "TOPLEFT" }, "text": "6", "orig": "6", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 36, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 209.5, "r_y0": 381.6, "r_x1": 214.1, "r_y1": 381.6, "r_x2": 214.1, "r_y2": 373.5, "r_x3": 209.5, "r_y3": 373.5, "coord_origin": "TOPLEFT" }, "text": "6", "orig": "6", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 37, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 246.7, "r_y0": 376.1, "r_x1": 271.4, "r_y1": 376.1, "r_x2": 271.4, "r_y2": 368.0, "r_x3": 246.7, "r_y3": 368.0, "coord_origin": "TOPLEFT" }, "text": "OTSL", "orig": "OTSL", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 38, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 289.0, "r_y0": 376.1, "r_x1": 310.0, "r_y1": 376.1, "r_x2": 310.0, "r_y2": 368.0, "r_x3": 289.0, "r_y3": 368.0, "coord_origin": "TOPLEFT" }, "text": "0.965", "orig": "0.965", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 39, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 326.7, "r_y0": 376.1, "r_x1": 347.7, "r_y1": 376.1, "r_x2": 347.7, "r_y2": 368.0, "r_x3": 326.7, "r_y3": 368.0, "coord_origin": "TOPLEFT" }, "text": "0.934", "orig": "0.934", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 40, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 363.7, "r_y0": 376.1, "r_x1": 384.7, "r_y1": 376.1, "r_x2": 384.7, "r_y2": 368.0, "r_x3": 363.7, "r_y3": 368.0, "coord_origin": "TOPLEFT" }, "text": "0.955", "orig": "0.955", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 41, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 397.3, "r_y0": 375.9, "r_x1": 416.1, "r_y1": 375.9, "r_x2": 416.1, "r_y2": 368.0, "r_x3": 397.3, "r_y3": 368.0, "coord_origin": "TOPLEFT" }, "text": "0.88", "orig": "0.88", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 42, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 439.5, "r_y0": 375.9, "r_x1": 458.4, "r_y1": 375.9, "r_x2": 458.4, "r_y2": 368.0, "r_x3": 439.5, "r_y3": 368.0, "coord_origin": "TOPLEFT" }, "text": "2.73", "orig": "2.73", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 43, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 245.2, "r_y0": 389.1, "r_x1": 272.9, "r_y1": 389.1, "r_x2": 272.9, "r_y2": 381.0, "r_x3": 245.2, "r_y3": 381.0, "coord_origin": "TOPLEFT" }, "text": "HTML", "orig": "HTML", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 44, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 289.0, "r_y0": 389.1, "r_x1": 310.0, "r_y1": 389.1, "r_x2": 310.0, "r_y2": 381.0, "r_x3": 289.0, "r_y3": 381.0, "coord_origin": "TOPLEFT" }, "text": "0.969", "orig": "0.969", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 45, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 326.7, "r_y0": 389.1, "r_x1": 347.7, "r_y1": 389.1, "r_x2": 347.7, "r_y2": 381.0, "r_x3": 326.7, "r_y3": 381.0, "coord_origin": "TOPLEFT" }, "text": "0.927", "orig": "0.927", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 46, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 363.7, "r_y0": 389.1, "r_x1": 384.7, "r_y1": 389.1, "r_x2": 384.7, "r_y2": 381.0, "r_x3": 363.7, "r_y3": 381.0, "coord_origin": "TOPLEFT" }, "text": "0.955", "orig": "0.955", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 47, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 396.2, "r_y0": 389.1, "r_x1": 417.2, "r_y1": 389.1, "r_x2": 417.2, "r_y2": 381.0, "r_x3": 396.2, "r_y3": 381.0, "coord_origin": "TOPLEFT" }, "text": "0.857", "orig": "0.857", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 48, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 440.8, "r_y0": 389.1, "r_x1": 457.1, "r_y1": 389.1, "r_x2": 457.1, "r_y2": 381.0, "r_x3": 440.8, "r_y3": 381.0, "coord_origin": "TOPLEFT" }, "text": "5.39", "orig": "5.39", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 49, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 161.9, "r_y0": 407.9, "r_x1": 166.5, "r_y1": 407.9, "r_x2": 166.5, "r_y2": 399.8, "r_x3": 161.9, "r_y3": 399.8, "coord_origin": "TOPLEFT" }, "text": "4", "orig": "4", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 50, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 209.5, "r_y0": 407.9, "r_x1": 214.1, "r_y1": 407.9, "r_x2": 214.1, "r_y2": 399.8, "r_x3": 209.5, "r_y3": 399.8, "coord_origin": "TOPLEFT" }, "text": "4", "orig": "4", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 51, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 246.7, "r_y0": 402.4, "r_x1": 271.4, "r_y1": 402.4, "r_x2": 271.4, "r_y2": 394.3, "r_x3": 246.7, "r_y3": 394.3, "coord_origin": "TOPLEFT" }, "text": "OTSL", "orig": "OTSL", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 52, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 289.0, "r_y0": 402.4, "r_x1": 310.0, "r_y1": 402.4, "r_x2": 310.0, "r_y2": 394.3, "r_x3": 289.0, "r_y3": 394.3, "coord_origin": "TOPLEFT" }, "text": "0.938", "orig": "0.938", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 53, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 326.7, "r_y0": 402.4, "r_x1": 347.7, "r_y1": 402.4, "r_x2": 347.7, "r_y2": 394.3, "r_x3": 326.7, "r_y3": 394.3, "coord_origin": "TOPLEFT" }, "text": "0.904", "orig": "0.904", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 54, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 363.7, "r_y0": 402.4, "r_x1": 384.7, "r_y1": 402.4, "r_x2": 384.7, "r_y2": 394.3, "r_x3": 363.7, "r_y3": 394.3, "coord_origin": "TOPLEFT" }, "text": "0.927", "orig": "0.927", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 55, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 394.6, "r_y0": 402.2, "r_x1": 418.8, "r_y1": 402.2, "r_x2": 418.8, "r_y2": 394.3, "r_x3": 394.6, "r_y3": 394.3, "coord_origin": "TOPLEFT" }, "text": "0.853", "orig": "0.853", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 56, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 439.5, "r_y0": 402.2, "r_x1": 458.4, "r_y1": 402.2, "r_x2": 458.4, "r_y2": 394.3, "r_x3": 439.5, "r_y3": 394.3, "coord_origin": "TOPLEFT" }, "text": "1.97", "orig": "1.97", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 57, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 245.2, "r_y0": 415.4, "r_x1": 272.9, "r_y1": 415.4, "r_x2": 272.9, "r_y2": 407.3, "r_x3": 245.2, "r_y3": 407.3, "coord_origin": "TOPLEFT" }, "text": "HTML", "orig": "HTML", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 58, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 289.0, "r_y0": 415.4, "r_x1": 310.0, "r_y1": 415.4, "r_x2": 310.0, "r_y2": 407.3, "r_x3": 289.0, "r_y3": 407.3, "coord_origin": "TOPLEFT" }, "text": "0.952", "orig": "0.952", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 59, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 326.7, "r_y0": 415.4, "r_x1": 347.7, "r_y1": 415.4, "r_x2": 347.7, "r_y2": 407.3, "r_x3": 326.7, "r_y3": 407.3, "coord_origin": "TOPLEFT" }, "text": "0.909", "orig": "0.909", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 60, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 362.1, "r_y0": 415.2, "r_x1": 386.2, "r_y1": 415.2, "r_x2": 386.2, "r_y2": 407.2, "r_x3": 362.1, "r_y3": 407.2, "coord_origin": "TOPLEFT" }, "text": "0.938", "orig": "0.938", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 61, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 396.2, "r_y0": 415.4, "r_x1": 417.2, "r_y1": 415.4, "r_x2": 417.2, "r_y2": 407.3, "r_x3": 396.2, "r_y3": 407.3, "coord_origin": "TOPLEFT" }, "text": "0.843", "orig": "0.843", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 62, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 440.8, "r_y0": 415.4, "r_x1": 457.1, "r_y1": 415.4, "r_x2": 457.1, "r_y2": 407.3, "r_x3": 440.8, "r_y3": 407.3, "coord_origin": "TOPLEFT" }, "text": "3.77", "orig": "3.77", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 63, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 161.9, "r_y0": 434.2, "r_x1": 166.5, "r_y1": 434.2, "r_x2": 166.5, "r_y2": 426.1, "r_x3": 161.9, "r_y3": 426.1, "coord_origin": "TOPLEFT" }, "text": "2", "orig": "2", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 64, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 209.5, "r_y0": 434.2, "r_x1": 214.1, "r_y1": 434.2, "r_x2": 214.1, "r_y2": 426.1, "r_x3": 209.5, "r_y3": 426.1, "coord_origin": "TOPLEFT" }, "text": "4", "orig": "4", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 65, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 246.7, "r_y0": 428.7, "r_x1": 271.4, "r_y1": 428.7, "r_x2": 271.4, "r_y2": 420.6, "r_x3": 246.7, "r_y3": 420.6, "coord_origin": "TOPLEFT" }, "text": "OTSL", "orig": "OTSL", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 66, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 289.0, "r_y0": 428.7, "r_x1": 310.0, "r_y1": 428.7, "r_x2": 310.0, "r_y2": 420.6, "r_x3": 289.0, "r_y3": 420.6, "coord_origin": "TOPLEFT" }, "text": "0.923", "orig": "0.923", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 67, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 326.7, "r_y0": 428.7, "r_x1": 347.7, "r_y1": 428.7, "r_x2": 347.7, "r_y2": 420.6, "r_x3": 326.7, "r_y3": 420.6, "coord_origin": "TOPLEFT" }, "text": "0.897", "orig": "0.897", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 68, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 363.7, "r_y0": 428.7, "r_x1": 384.7, "r_y1": 428.7, "r_x2": 384.7, "r_y2": 420.6, "r_x3": 363.7, "r_y3": 420.6, "coord_origin": "TOPLEFT" }, "text": "0.915", "orig": "0.915", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 69, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 394.6, "r_y0": 428.5, "r_x1": 418.8, "r_y1": 428.5, "r_x2": 418.8, "r_y2": 420.6, "r_x3": 394.6, "r_y3": 420.6, "coord_origin": "TOPLEFT" }, "text": "0.859", "orig": "0.859", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 70, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 439.5, "r_y0": 428.5, "r_x1": 458.4, "r_y1": 428.5, "r_x2": 458.4, "r_y2": 420.6, "r_x3": 439.5, "r_y3": 420.6, "coord_origin": "TOPLEFT" }, "text": "1.91", "orig": "1.91", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 71, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 245.2, "r_y0": 441.7, "r_x1": 272.9, "r_y1": 441.7, "r_x2": 272.9, "r_y2": 433.6, "r_x3": 245.2, "r_y3": 433.6, "coord_origin": "TOPLEFT" }, "text": "HTML", "orig": "HTML", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 72, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 289.0, "r_y0": 441.7, "r_x1": 310.0, "r_y1": 441.7, "r_x2": 310.0, "r_y2": 433.6, "r_x3": 289.0, "r_y3": 433.6, "coord_origin": "TOPLEFT" }, "text": "0.945", "orig": "0.945", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 73, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 326.7, "r_y0": 441.7, "r_x1": 347.7, "r_y1": 441.7, "r_x2": 347.7, "r_y2": 433.6, "r_x3": 326.7, "r_y3": 433.6, "coord_origin": "TOPLEFT" }, "text": "0.901", "orig": "0.901", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 74, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 362.1, "r_y0": 441.5, "r_x1": 386.2, "r_y1": 441.5, "r_x2": 386.2, "r_y2": 433.5, "r_x3": 362.1, "r_y3": 433.5, "coord_origin": "TOPLEFT" }, "text": "0.931", "orig": "0.931", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 75, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 396.2, "r_y0": 441.7, "r_x1": 417.2, "r_y1": 441.7, "r_x2": 417.2, "r_y2": 433.6, "r_x3": 396.2, "r_y3": 433.6, "coord_origin": "TOPLEFT" }, "text": "0.834", "orig": "0.834", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 76, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 440.8, "r_y0": 441.7, "r_x1": 457.1, "r_y1": 441.7, "r_x2": 457.1, "r_y2": 433.6, "r_x3": 440.8, "r_y3": 433.6, "coord_origin": "TOPLEFT" }, "text": "3.81", "orig": "3.81", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 77, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 161.9, "r_y0": 460.5, "r_x1": 166.5, "r_y1": 460.5, "r_x2": 166.5, "r_y2": 452.4, "r_x3": 161.9, "r_y3": 452.4, "coord_origin": "TOPLEFT" }, "text": "4", "orig": "4", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 78, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 209.5, "r_y0": 460.5, "r_x1": 214.1, "r_y1": 460.5, "r_x2": 214.1, "r_y2": 452.4, "r_x3": 209.5, "r_y3": 452.4, "coord_origin": "TOPLEFT" }, "text": "2", "orig": "2", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 79, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 246.7, "r_y0": 455.0, "r_x1": 271.4, "r_y1": 455.0, "r_x2": 271.4, "r_y2": 446.9, "r_x3": 246.7, "r_y3": 446.9, "coord_origin": "TOPLEFT" }, "text": "OTSL", "orig": "OTSL", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 80, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 289.0, "r_y0": 455.0, "r_x1": 310.0, "r_y1": 455.0, "r_x2": 310.0, "r_y2": 446.9, "r_x3": 289.0, "r_y3": 446.9, "coord_origin": "TOPLEFT" }, "text": "0.952", "orig": "0.952", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 81, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 329.0, "r_y0": 455.0, "r_x1": 345.4, "r_y1": 455.0, "r_x2": 345.4, "r_y2": 446.9, "r_x3": 329.0, "r_y3": 446.9, "coord_origin": "TOPLEFT" }, "text": "0.92", "orig": "0.92", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 82, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 362.1, "r_y0": 454.8, "r_x1": 386.2, "r_y1": 454.8, "r_x2": 386.2, "r_y2": 446.9, "r_x3": 362.1, "r_y3": 446.9, "coord_origin": "TOPLEFT" }, "text": "0.942", "orig": "0.942", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 83, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 394.6, "r_y0": 454.8, "r_x1": 418.8, "r_y1": 454.8, "r_x2": 418.8, "r_y2": 446.9, "r_x3": 394.6, "r_y3": 446.9, "coord_origin": "TOPLEFT" }, "text": "0.857", "orig": "0.857", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 84, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 439.5, "r_y0": 454.8, "r_x1": 458.4, "r_y1": 454.8, "r_x2": 458.4, "r_y2": 446.9, "r_x3": 439.5, "r_y3": 446.9, "coord_origin": "TOPLEFT" }, "text": "1.22", "orig": "1.22", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 85, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 245.2, "r_y0": 468.0, "r_x1": 272.9, "r_y1": 468.0, "r_x2": 272.9, "r_y2": 459.9, "r_x3": 245.2, "r_y3": 459.9, "coord_origin": "TOPLEFT" }, "text": "HTML", "orig": "HTML", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 86, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 289.0, "r_y0": 468.0, "r_x1": 310.0, "r_y1": 468.0, "r_x2": 310.0, "r_y2": 459.9, "r_x3": 289.0, "r_y3": 459.9, "coord_origin": "TOPLEFT" }, "text": "0.944", "orig": "0.944", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 87, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 326.7, "r_y0": 468.0, "r_x1": 347.7, "r_y1": 468.0, "r_x2": 347.7, "r_y2": 459.9, "r_x3": 326.7, "r_y3": 459.9, "coord_origin": "TOPLEFT" }, "text": "0.903", "orig": "0.903", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 88, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 363.7, "r_y0": 468.0, "r_x1": 384.7, "r_y1": 468.0, "r_x2": 384.7, "r_y2": 459.9, "r_x3": 363.7, "r_y3": 459.9, "coord_origin": "TOPLEFT" }, "text": "0.931", "orig": "0.931", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 89, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 396.2, "r_y0": 468.0, "r_x1": 417.2, "r_y1": 468.0, "r_x2": 417.2, "r_y2": 459.9, "r_x3": 396.2, "r_y3": 459.9, "coord_origin": "TOPLEFT" }, "text": "0.824", "orig": "0.824", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 90, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 446.7, "r_y0": 468.0, "r_x1": 451.3, "r_y1": 468.0, "r_x2": 451.3, "r_y2": 459.9, "r_x3": 446.7, "r_y3": 459.9, "coord_origin": "TOPLEFT" }, "text": "2", "orig": "2", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [ { "id": 11, "label": "text", "bbox": { "l": 160.4, "t": 341.7, "r": 168.0, "b": 349.8, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 22, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 160.4, "r_y0": 349.8, "r_x1": 168.0, "r_y1": 349.8, "r_x2": 168.0, "r_y2": 341.7, "r_x3": 160.4, "r_y3": 341.7, "coord_origin": "TOPLEFT" }, "text": "#", "orig": "#", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 12, "label": "text", "bbox": { "l": 144.6, "t": 354.7, "r": 183.8, "b": 362.8, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 23, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 144.6, "r_y0": 362.8, "r_x1": 183.8, "r_y1": 362.8, "r_x2": 183.8, "r_y2": 354.7, "r_x3": 144.6, "r_y3": 354.7, "coord_origin": "TOPLEFT" }, "text": "enc-layers", "orig": "enc-layers", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 13, "label": "text", "bbox": { "l": 208.0, "t": 341.7, "r": 215.7, "b": 349.8, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 24, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 208.0, "r_y0": 349.8, "r_x1": 215.7, "r_y1": 349.8, "r_x2": 215.7, "r_y2": 341.7, "r_x3": 208.0, "r_y3": 341.7, "coord_origin": "TOPLEFT" }, "text": "#", "orig": "#", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 14, "label": "text", "bbox": { "l": 192.2, "t": 354.7, "r": 231.4, "b": 362.8, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 25, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 192.2, "r_y0": 362.8, "r_x1": 231.4, "r_y1": 362.8, "r_x2": 231.4, "r_y2": 354.7, "r_x3": 192.2, "r_y3": 354.7, "coord_origin": "TOPLEFT" }, "text": "dec-layers", "orig": "dec-layers", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 15, "label": "text", "bbox": { "l": 239.8, "t": 347.2, "r": 278.3, "b": 355.3, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 26, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 239.8, "r_y0": 355.3, "r_x1": 278.3, "r_y1": 355.3, "r_x2": 278.3, "r_y2": 347.2, "r_x3": 239.8, "r_y3": 347.2, "coord_origin": "TOPLEFT" }, "text": "Language", "orig": "Language", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 16, "label": "text", "bbox": { "l": 324.7, "t": 341.7, "r": 348.3, "b": 349.8, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 27, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 324.7, "r_y0": 349.8, "r_x1": 348.3, "r_y1": 349.8, "r_x2": 348.3, "r_y2": 341.7, "r_x3": 324.7, "r_y3": 341.7, "coord_origin": "TOPLEFT" }, "text": "TEDs", "orig": "TEDs", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 17, "label": "text", "bbox": { "l": 396.3, "t": 341.7, "r": 417.1, "b": 349.8, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 28, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 396.3, "r_y0": 349.8, "r_x1": 417.1, "r_y1": 349.8, "r_x2": 417.1, "r_y2": 341.7, "r_x3": 396.3, "r_y3": 341.7, "coord_origin": "TOPLEFT" }, "text": "mAP", "orig": "mAP", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 18, "label": "text", "bbox": { "l": 394.9, "t": 352.7, "r": 418.5, "b": 360.8, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 29, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 394.9, "r_y0": 360.8, "r_x1": 418.5, "r_y1": 360.8, "r_x2": 418.5, "r_y2": 352.7, "r_x3": 394.9, "r_y3": 352.7, "coord_origin": "TOPLEFT" }, "text": "(0.75)", "orig": "(0.75)", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 19, "label": "text", "bbox": { "l": 430.8, "t": 341.7, "r": 467.1, "b": 349.8, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 30, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 430.8, "r_y0": 349.8, "r_x1": 467.1, "r_y1": 349.8, "r_x2": 467.1, "r_y2": 341.7, "r_x3": 430.8, "r_y3": 341.7, "coord_origin": "TOPLEFT" }, "text": "Inference", "orig": "Inference", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 20, "label": "text", "bbox": { "l": 427.1, "t": 352.7, "r": 470.8, "b": 360.8, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 31, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 427.1, "r_y0": 360.8, "r_x1": 470.8, "r_y1": 360.8, "r_x2": 470.8, "r_y2": 352.7, "r_x3": 427.1, "r_y3": 352.7, "coord_origin": "TOPLEFT" }, "text": "time (secs)", "orig": "time (secs)", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 21, "label": "text", "bbox": { "l": 286.7, "t": 354.7, "r": 312.3, "b": 362.8, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 32, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 286.7, "r_y0": 362.8, "r_x1": 312.3, "r_y1": 362.8, "r_x2": 312.3, "r_y2": 354.7, "r_x3": 286.7, "r_y3": 354.7, "coord_origin": "TOPLEFT" }, "text": "simple", "orig": "simple", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 22, "label": "text", "bbox": { "l": 320.7, "t": 354.7, "r": 353.7, "b": 362.8, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 33, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 320.7, "r_y0": 362.8, "r_x1": 353.7, "r_y1": 362.8, "r_x2": 353.7, "r_y2": 354.7, "r_x3": 320.7, "r_y3": 354.7, "coord_origin": "TOPLEFT" }, "text": "complex", "orig": "complex", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 23, "label": "text", "bbox": { "l": 369.3, "t": 354.7, "r": 379.0, "b": 362.8, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 34, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 369.3, "r_y0": 362.8, "r_x1": 379.0, "r_y1": 362.8, "r_x2": 379.0, "r_y2": 354.7, "r_x3": 369.3, "r_y3": 354.7, "coord_origin": "TOPLEFT" }, "text": "all", "orig": "all", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 24, "label": "text", "bbox": { "l": 161.9, "t": 373.5, "r": 166.5, "b": 381.6, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 35, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 161.9, "r_y0": 381.6, "r_x1": 166.5, "r_y1": 381.6, "r_x2": 166.5, "r_y2": 373.5, "r_x3": 161.9, "r_y3": 373.5, "coord_origin": "TOPLEFT" }, "text": "6", "orig": "6", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 25, "label": "text", "bbox": { "l": 209.5, "t": 373.5, "r": 214.1, "b": 381.6, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 36, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 209.5, "r_y0": 381.6, "r_x1": 214.1, "r_y1": 381.6, "r_x2": 214.1, "r_y2": 373.5, "r_x3": 209.5, "r_y3": 373.5, "coord_origin": "TOPLEFT" }, "text": "6", "orig": "6", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 26, "label": "text", "bbox": { "l": 246.7, "t": 368.0, "r": 271.4, "b": 376.1, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 37, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 246.7, "r_y0": 376.1, "r_x1": 271.4, "r_y1": 376.1, "r_x2": 271.4, "r_y2": 368.0, "r_x3": 246.7, "r_y3": 368.0, "coord_origin": "TOPLEFT" }, "text": "OTSL", "orig": "OTSL", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 27, "label": "text", "bbox": { "l": 289.0, "t": 368.0, "r": 310.0, "b": 376.1, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 38, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 289.0, "r_y0": 376.1, "r_x1": 310.0, "r_y1": 376.1, "r_x2": 310.0, "r_y2": 368.0, "r_x3": 289.0, "r_y3": 368.0, "coord_origin": "TOPLEFT" }, "text": "0.965", "orig": "0.965", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 28, "label": "text", "bbox": { "l": 326.7, "t": 368.0, "r": 347.7, "b": 376.1, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 39, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 326.7, "r_y0": 376.1, "r_x1": 347.7, "r_y1": 376.1, "r_x2": 347.7, "r_y2": 368.0, "r_x3": 326.7, "r_y3": 368.0, "coord_origin": "TOPLEFT" }, "text": "0.934", "orig": "0.934", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 29, "label": "text", "bbox": { "l": 363.7, "t": 368.0, "r": 384.7, "b": 376.1, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 40, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 363.7, "r_y0": 376.1, "r_x1": 384.7, "r_y1": 376.1, "r_x2": 384.7, "r_y2": 368.0, "r_x3": 363.7, "r_y3": 368.0, "coord_origin": "TOPLEFT" }, "text": "0.955", "orig": "0.955", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 30, "label": "text", "bbox": { "l": 397.3, "t": 368.0, "r": 416.1, "b": 375.9, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 41, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 397.3, "r_y0": 375.9, "r_x1": 416.1, "r_y1": 375.9, "r_x2": 416.1, "r_y2": 368.0, "r_x3": 397.3, "r_y3": 368.0, "coord_origin": "TOPLEFT" }, "text": "0.88", "orig": "0.88", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 31, "label": "text", "bbox": { "l": 439.5, "t": 368.0, "r": 458.4, "b": 375.9, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 42, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 439.5, "r_y0": 375.9, "r_x1": 458.4, "r_y1": 375.9, "r_x2": 458.4, "r_y2": 368.0, "r_x3": 439.5, "r_y3": 368.0, "coord_origin": "TOPLEFT" }, "text": "2.73", "orig": "2.73", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 32, "label": "text", "bbox": { "l": 245.2, "t": 381.0, "r": 272.9, "b": 389.1, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 43, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 245.2, "r_y0": 389.1, "r_x1": 272.9, "r_y1": 389.1, "r_x2": 272.9, "r_y2": 381.0, "r_x3": 245.2, "r_y3": 381.0, "coord_origin": "TOPLEFT" }, "text": "HTML", "orig": "HTML", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 33, "label": "text", "bbox": { "l": 289.0, "t": 381.0, "r": 310.0, "b": 389.1, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 44, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 289.0, "r_y0": 389.1, "r_x1": 310.0, "r_y1": 389.1, "r_x2": 310.0, "r_y2": 381.0, "r_x3": 289.0, "r_y3": 381.0, "coord_origin": "TOPLEFT" }, "text": "0.969", "orig": "0.969", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 34, "label": "text", "bbox": { "l": 326.7, "t": 381.0, "r": 347.7, "b": 389.1, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 45, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 326.7, "r_y0": 389.1, "r_x1": 347.7, "r_y1": 389.1, "r_x2": 347.7, "r_y2": 381.0, "r_x3": 326.7, "r_y3": 381.0, "coord_origin": "TOPLEFT" }, "text": "0.927", "orig": "0.927", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 35, "label": "text", "bbox": { "l": 363.7, "t": 381.0, "r": 384.7, "b": 389.1, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 46, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 363.7, "r_y0": 389.1, "r_x1": 384.7, "r_y1": 389.1, "r_x2": 384.7, "r_y2": 381.0, "r_x3": 363.7, "r_y3": 381.0, "coord_origin": "TOPLEFT" }, "text": "0.955", "orig": "0.955", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 36, "label": "text", "bbox": { "l": 396.2, "t": 381.0, "r": 417.2, "b": 389.1, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 47, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 396.2, "r_y0": 389.1, "r_x1": 417.2, "r_y1": 389.1, "r_x2": 417.2, "r_y2": 381.0, "r_x3": 396.2, "r_y3": 381.0, "coord_origin": "TOPLEFT" }, "text": "0.857", "orig": "0.857", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 37, "label": "text", "bbox": { "l": 440.8, "t": 381.0, "r": 457.1, "b": 389.1, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 48, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 440.8, "r_y0": 389.1, "r_x1": 457.1, "r_y1": 389.1, "r_x2": 457.1, "r_y2": 381.0, "r_x3": 440.8, "r_y3": 381.0, "coord_origin": "TOPLEFT" }, "text": "5.39", "orig": "5.39", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 38, "label": "text", "bbox": { "l": 161.9, "t": 399.8, "r": 166.5, "b": 407.9, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 49, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 161.9, "r_y0": 407.9, "r_x1": 166.5, "r_y1": 407.9, "r_x2": 166.5, "r_y2": 399.8, "r_x3": 161.9, "r_y3": 399.8, "coord_origin": "TOPLEFT" }, "text": "4", "orig": "4", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 39, "label": "text", "bbox": { "l": 209.5, "t": 399.8, "r": 214.1, "b": 407.9, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 50, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 209.5, "r_y0": 407.9, "r_x1": 214.1, "r_y1": 407.9, "r_x2": 214.1, "r_y2": 399.8, "r_x3": 209.5, "r_y3": 399.8, "coord_origin": "TOPLEFT" }, "text": "4", "orig": "4", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 40, "label": "text", "bbox": { "l": 246.7, "t": 394.3, "r": 271.4, "b": 402.4, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 51, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 246.7, "r_y0": 402.4, "r_x1": 271.4, "r_y1": 402.4, "r_x2": 271.4, "r_y2": 394.3, "r_x3": 246.7, "r_y3": 394.3, "coord_origin": "TOPLEFT" }, "text": "OTSL", "orig": "OTSL", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 41, "label": "text", "bbox": { "l": 289.0, "t": 394.3, "r": 310.0, "b": 402.4, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 52, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 289.0, "r_y0": 402.4, "r_x1": 310.0, "r_y1": 402.4, "r_x2": 310.0, "r_y2": 394.3, "r_x3": 289.0, "r_y3": 394.3, "coord_origin": "TOPLEFT" }, "text": "0.938", "orig": "0.938", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 42, "label": "text", "bbox": { "l": 326.7, "t": 394.3, "r": 347.7, "b": 402.4, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 53, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 326.7, "r_y0": 402.4, "r_x1": 347.7, "r_y1": 402.4, "r_x2": 347.7, "r_y2": 394.3, "r_x3": 326.7, "r_y3": 394.3, "coord_origin": "TOPLEFT" }, "text": "0.904", "orig": "0.904", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 43, "label": "text", "bbox": { "l": 363.7, "t": 394.3, "r": 384.7, "b": 402.4, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 54, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 363.7, "r_y0": 402.4, "r_x1": 384.7, "r_y1": 402.4, "r_x2": 384.7, "r_y2": 394.3, "r_x3": 363.7, "r_y3": 394.3, "coord_origin": "TOPLEFT" }, "text": "0.927", "orig": "0.927", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 44, "label": "text", "bbox": { "l": 394.6, "t": 394.3, "r": 418.8, "b": 402.2, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 55, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 394.6, "r_y0": 402.2, "r_x1": 418.8, "r_y1": 402.2, "r_x2": 418.8, "r_y2": 394.3, "r_x3": 394.6, "r_y3": 394.3, "coord_origin": "TOPLEFT" }, "text": "0.853", "orig": "0.853", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 45, "label": "text", "bbox": { "l": 439.5, "t": 394.3, "r": 458.4, "b": 402.2, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 56, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 439.5, "r_y0": 402.2, "r_x1": 458.4, "r_y1": 402.2, "r_x2": 458.4, "r_y2": 394.3, "r_x3": 439.5, "r_y3": 394.3, "coord_origin": "TOPLEFT" }, "text": "1.97", "orig": "1.97", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 46, "label": "text", "bbox": { "l": 245.2, "t": 407.3, "r": 272.9, "b": 415.4, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 57, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 245.2, "r_y0": 415.4, "r_x1": 272.9, "r_y1": 415.4, "r_x2": 272.9, "r_y2": 407.3, "r_x3": 245.2, "r_y3": 407.3, "coord_origin": "TOPLEFT" }, "text": "HTML", "orig": "HTML", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 47, "label": "text", "bbox": { "l": 289.0, "t": 407.3, "r": 310.0, "b": 415.4, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 58, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 289.0, "r_y0": 415.4, "r_x1": 310.0, "r_y1": 415.4, "r_x2": 310.0, "r_y2": 407.3, "r_x3": 289.0, "r_y3": 407.3, "coord_origin": "TOPLEFT" }, "text": "0.952", "orig": "0.952", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 48, "label": "text", "bbox": { "l": 326.7, "t": 407.3, "r": 347.7, "b": 415.4, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 59, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 326.7, "r_y0": 415.4, "r_x1": 347.7, "r_y1": 415.4, "r_x2": 347.7, "r_y2": 407.3, "r_x3": 326.7, "r_y3": 407.3, "coord_origin": "TOPLEFT" }, "text": "0.909", "orig": "0.909", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 49, "label": "text", "bbox": { "l": 362.1, "t": 407.2, "r": 386.2, "b": 415.2, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 60, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 362.1, "r_y0": 415.2, "r_x1": 386.2, "r_y1": 415.2, "r_x2": 386.2, "r_y2": 407.2, "r_x3": 362.1, "r_y3": 407.2, "coord_origin": "TOPLEFT" }, "text": "0.938", "orig": "0.938", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 50, "label": "text", "bbox": { "l": 396.2, "t": 407.3, "r": 417.2, "b": 415.4, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 61, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 396.2, "r_y0": 415.4, "r_x1": 417.2, "r_y1": 415.4, "r_x2": 417.2, "r_y2": 407.3, "r_x3": 396.2, "r_y3": 407.3, "coord_origin": "TOPLEFT" }, "text": "0.843", "orig": "0.843", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 51, "label": "text", "bbox": { "l": 440.8, "t": 407.3, "r": 457.1, "b": 415.4, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 62, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 440.8, "r_y0": 415.4, "r_x1": 457.1, "r_y1": 415.4, "r_x2": 457.1, "r_y2": 407.3, "r_x3": 440.8, "r_y3": 407.3, "coord_origin": "TOPLEFT" }, "text": "3.77", "orig": "3.77", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 52, "label": "text", "bbox": { "l": 161.9, "t": 426.1, "r": 166.5, "b": 434.2, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 63, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 161.9, "r_y0": 434.2, "r_x1": 166.5, "r_y1": 434.2, "r_x2": 166.5, "r_y2": 426.1, "r_x3": 161.9, "r_y3": 426.1, "coord_origin": "TOPLEFT" }, "text": "2", "orig": "2", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 53, "label": "text", "bbox": { "l": 209.5, "t": 426.1, "r": 214.1, "b": 434.2, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 64, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 209.5, "r_y0": 434.2, "r_x1": 214.1, "r_y1": 434.2, "r_x2": 214.1, "r_y2": 426.1, "r_x3": 209.5, "r_y3": 426.1, "coord_origin": "TOPLEFT" }, "text": "4", "orig": "4", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 54, "label": "text", "bbox": { "l": 246.7, "t": 420.6, "r": 271.4, "b": 428.7, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 65, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 246.7, "r_y0": 428.7, "r_x1": 271.4, "r_y1": 428.7, "r_x2": 271.4, "r_y2": 420.6, "r_x3": 246.7, "r_y3": 420.6, "coord_origin": "TOPLEFT" }, "text": "OTSL", "orig": "OTSL", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 55, "label": "text", "bbox": { "l": 289.0, "t": 420.6, "r": 310.0, "b": 428.7, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 66, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 289.0, "r_y0": 428.7, "r_x1": 310.0, "r_y1": 428.7, "r_x2": 310.0, "r_y2": 420.6, "r_x3": 289.0, "r_y3": 420.6, "coord_origin": "TOPLEFT" }, "text": "0.923", "orig": "0.923", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 56, "label": "text", "bbox": { "l": 326.7, "t": 420.6, "r": 347.7, "b": 428.7, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 67, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 326.7, "r_y0": 428.7, "r_x1": 347.7, "r_y1": 428.7, "r_x2": 347.7, "r_y2": 420.6, "r_x3": 326.7, "r_y3": 420.6, "coord_origin": "TOPLEFT" }, "text": "0.897", "orig": "0.897", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 57, "label": "text", "bbox": { "l": 363.7, "t": 420.6, "r": 384.7, "b": 428.7, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 68, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 363.7, "r_y0": 428.7, "r_x1": 384.7, "r_y1": 428.7, "r_x2": 384.7, "r_y2": 420.6, "r_x3": 363.7, "r_y3": 420.6, "coord_origin": "TOPLEFT" }, "text": "0.915", "orig": "0.915", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 58, "label": "text", "bbox": { "l": 394.6, "t": 420.6, "r": 418.8, "b": 428.5, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 69, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 394.6, "r_y0": 428.5, "r_x1": 418.8, "r_y1": 428.5, "r_x2": 418.8, "r_y2": 420.6, "r_x3": 394.6, "r_y3": 420.6, "coord_origin": "TOPLEFT" }, "text": "0.859", "orig": "0.859", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 59, "label": "text", "bbox": { "l": 439.5, "t": 420.6, "r": 458.4, "b": 428.5, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 70, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 439.5, "r_y0": 428.5, "r_x1": 458.4, "r_y1": 428.5, "r_x2": 458.4, "r_y2": 420.6, "r_x3": 439.5, "r_y3": 420.6, "coord_origin": "TOPLEFT" }, "text": "1.91", "orig": "1.91", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 60, "label": "text", "bbox": { "l": 245.2, "t": 433.6, "r": 272.9, "b": 441.7, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 71, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 245.2, "r_y0": 441.7, "r_x1": 272.9, "r_y1": 441.7, "r_x2": 272.9, "r_y2": 433.6, "r_x3": 245.2, "r_y3": 433.6, "coord_origin": "TOPLEFT" }, "text": "HTML", "orig": "HTML", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 61, "label": "text", "bbox": { "l": 289.0, "t": 433.6, "r": 310.0, "b": 441.7, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 72, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 289.0, "r_y0": 441.7, "r_x1": 310.0, "r_y1": 441.7, "r_x2": 310.0, "r_y2": 433.6, "r_x3": 289.0, "r_y3": 433.6, "coord_origin": "TOPLEFT" }, "text": "0.945", "orig": "0.945", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 62, "label": "text", "bbox": { "l": 326.7, "t": 433.6, "r": 347.7, "b": 441.7, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 73, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 326.7, "r_y0": 441.7, "r_x1": 347.7, "r_y1": 441.7, "r_x2": 347.7, "r_y2": 433.6, "r_x3": 326.7, "r_y3": 433.6, "coord_origin": "TOPLEFT" }, "text": "0.901", "orig": "0.901", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 63, "label": "text", "bbox": { "l": 362.1, "t": 433.5, "r": 386.2, "b": 441.5, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 74, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 362.1, "r_y0": 441.5, "r_x1": 386.2, "r_y1": 441.5, "r_x2": 386.2, "r_y2": 433.5, "r_x3": 362.1, "r_y3": 433.5, "coord_origin": "TOPLEFT" }, "text": "0.931", "orig": "0.931", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 64, "label": "text", "bbox": { "l": 396.2, "t": 433.6, "r": 417.2, "b": 441.7, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 75, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 396.2, "r_y0": 441.7, "r_x1": 417.2, "r_y1": 441.7, "r_x2": 417.2, "r_y2": 433.6, "r_x3": 396.2, "r_y3": 433.6, "coord_origin": "TOPLEFT" }, "text": "0.834", "orig": "0.834", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 65, "label": "text", "bbox": { "l": 440.8, "t": 433.6, "r": 457.1, "b": 441.7, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 76, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 440.8, "r_y0": 441.7, "r_x1": 457.1, "r_y1": 441.7, "r_x2": 457.1, "r_y2": 433.6, "r_x3": 440.8, "r_y3": 433.6, "coord_origin": "TOPLEFT" }, "text": "3.81", "orig": "3.81", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 66, "label": "text", "bbox": { "l": 161.9, "t": 452.4, "r": 166.5, "b": 460.5, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 77, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 161.9, "r_y0": 460.5, "r_x1": 166.5, "r_y1": 460.5, "r_x2": 166.5, "r_y2": 452.4, "r_x3": 161.9, "r_y3": 452.4, "coord_origin": "TOPLEFT" }, "text": "4", "orig": "4", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 67, "label": "text", "bbox": { "l": 209.5, "t": 452.4, "r": 214.1, "b": 460.5, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 78, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 209.5, "r_y0": 460.5, "r_x1": 214.1, "r_y1": 460.5, "r_x2": 214.1, "r_y2": 452.4, "r_x3": 209.5, "r_y3": 452.4, "coord_origin": "TOPLEFT" }, "text": "2", "orig": "2", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 68, "label": "text", "bbox": { "l": 246.7, "t": 446.9, "r": 271.4, "b": 455.0, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 79, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 246.7, "r_y0": 455.0, "r_x1": 271.4, "r_y1": 455.0, "r_x2": 271.4, "r_y2": 446.9, "r_x3": 246.7, "r_y3": 446.9, "coord_origin": "TOPLEFT" }, "text": "OTSL", "orig": "OTSL", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 69, "label": "text", "bbox": { "l": 289.0, "t": 446.9, "r": 310.0, "b": 455.0, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 80, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 289.0, "r_y0": 455.0, "r_x1": 310.0, "r_y1": 455.0, "r_x2": 310.0, "r_y2": 446.9, "r_x3": 289.0, "r_y3": 446.9, "coord_origin": "TOPLEFT" }, "text": "0.952", "orig": "0.952", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 70, "label": "text", "bbox": { "l": 329.0, "t": 446.9, "r": 345.4, "b": 455.0, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 81, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 329.0, "r_y0": 455.0, "r_x1": 345.4, "r_y1": 455.0, "r_x2": 345.4, "r_y2": 446.9, "r_x3": 329.0, "r_y3": 446.9, "coord_origin": "TOPLEFT" }, "text": "0.92", "orig": "0.92", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 71, "label": "text", "bbox": { "l": 362.1, "t": 446.9, "r": 386.2, "b": 454.8, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 82, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 362.1, "r_y0": 454.8, "r_x1": 386.2, "r_y1": 454.8, "r_x2": 386.2, "r_y2": 446.9, "r_x3": 362.1, "r_y3": 446.9, "coord_origin": "TOPLEFT" }, "text": "0.942", "orig": "0.942", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 72, "label": "text", "bbox": { "l": 394.6, "t": 446.9, "r": 418.8, "b": 454.8, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 83, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 394.6, "r_y0": 454.8, "r_x1": 418.8, "r_y1": 454.8, "r_x2": 418.8, "r_y2": 446.9, "r_x3": 394.6, "r_y3": 446.9, "coord_origin": "TOPLEFT" }, "text": "0.857", "orig": "0.857", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 73, "label": "text", "bbox": { "l": 439.5, "t": 446.9, "r": 458.4, "b": 454.8, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 84, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 439.5, "r_y0": 454.8, "r_x1": 458.4, "r_y1": 454.8, "r_x2": 458.4, "r_y2": 446.9, "r_x3": 439.5, "r_y3": 446.9, "coord_origin": "TOPLEFT" }, "text": "1.22", "orig": "1.22", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 74, "label": "text", "bbox": { "l": 245.2, "t": 459.9, "r": 272.9, "b": 468.0, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 85, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 245.2, "r_y0": 468.0, "r_x1": 272.9, "r_y1": 468.0, "r_x2": 272.9, "r_y2": 459.9, "r_x3": 245.2, "r_y3": 459.9, "coord_origin": "TOPLEFT" }, "text": "HTML", "orig": "HTML", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 75, "label": "text", "bbox": { "l": 289.0, "t": 459.9, "r": 310.0, "b": 468.0, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 86, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 289.0, "r_y0": 468.0, "r_x1": 310.0, "r_y1": 468.0, "r_x2": 310.0, "r_y2": 459.9, "r_x3": 289.0, "r_y3": 459.9, "coord_origin": "TOPLEFT" }, "text": "0.944", "orig": "0.944", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 76, "label": "text", "bbox": { "l": 326.7, "t": 459.9, "r": 347.7, "b": 468.0, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 87, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 326.7, "r_y0": 468.0, "r_x1": 347.7, "r_y1": 468.0, "r_x2": 347.7, "r_y2": 459.9, "r_x3": 326.7, "r_y3": 459.9, "coord_origin": "TOPLEFT" }, "text": "0.903", "orig": "0.903", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 77, "label": "text", "bbox": { "l": 363.7, "t": 459.9, "r": 384.7, "b": 468.0, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 88, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 363.7, "r_y0": 468.0, "r_x1": 384.7, "r_y1": 468.0, "r_x2": 384.7, "r_y2": 459.9, "r_x3": 363.7, "r_y3": 459.9, "coord_origin": "TOPLEFT" }, "text": "0.931", "orig": "0.931", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 78, "label": "text", "bbox": { "l": 396.2, "t": 459.9, "r": 417.2, "b": 468.0, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 89, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 396.2, "r_y0": 468.0, "r_x1": 417.2, "r_y1": 468.0, "r_x2": 417.2, "r_y2": 459.9, "r_x3": 396.2, "r_y3": 459.9, "coord_origin": "TOPLEFT" }, "text": "0.824", "orig": "0.824", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 79, "label": "text", "bbox": { "l": 446.7, "t": 459.9, "r": 451.3, "b": 468.0, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 90, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 446.7, "r_y0": 468.0, "r_x1": 451.3, "r_y1": 468.0, "r_x2": 451.3, "r_y2": 459.9, "r_x3": 446.7, "r_y3": 459.9, "coord_origin": "TOPLEFT" }, "text": "2", "orig": "2", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] } ] }, "text": null, "otsl_seq": [ "ched", "ched", "ched", "ched", "lcel", "lcel", "ched", "ched", "nl", "ucel", "ucel", "ucel", "ched", "ched", "ched", "ched", "ched", "nl", "fcel", "fcel", "fcel", "fcel", "fcel", "fcel", "fcel", "fcel", "nl", "fcel", "fcel", "fcel", "fcel", "fcel", "fcel", "fcel", "fcel", "nl", "fcel", "fcel", "fcel", "fcel", "fcel", "fcel", "fcel", "fcel", "nl", "fcel", "fcel", "fcel", "fcel", "fcel", "fcel", "fcel", "fcel", "nl" ], "num_rows": 6, "num_cols": 8, "table_cells": [ { "bbox": { "l": 160.4, "t": 341.7, "r": 168.0, "b": 349.8, "coord_origin": "TOPLEFT" }, "row_span": 2, "col_span": 1, "start_row_offset_idx": 0, "end_row_offset_idx": 2, "start_col_offset_idx": 0, "end_col_offset_idx": 1, "text": "# enc-layers", "column_header": true, "row_header": false, "row_section": false }, { "bbox": { "l": 208.0, "t": 341.7, "r": 215.7, "b": 349.8, "coord_origin": "TOPLEFT" }, "row_span": 2, "col_span": 1, "start_row_offset_idx": 0, "end_row_offset_idx": 2, "start_col_offset_idx": 1, "end_col_offset_idx": 2, "text": "# dec-layers", "column_header": true, "row_header": false, "row_section": false }, { "bbox": { "l": 239.8, "t": 347.2, "r": 278.3, "b": 355.3, "coord_origin": "TOPLEFT" }, "row_span": 2, "col_span": 1, "start_row_offset_idx": 0, "end_row_offset_idx": 2, "start_col_offset_idx": 2, "end_col_offset_idx": 3, "text": "Language", "column_header": true, "row_header": false, "row_section": false }, { "bbox": { "l": 324.7, "t": 341.7, "r": 348.3, "b": 349.8, "coord_origin": "TOPLEFT" }, "row_span": 1, "col_span": 3, "start_row_offset_idx": 0, "end_row_offset_idx": 1, "start_col_offset_idx": 3, "end_col_offset_idx": 6, "text": "TEDs", "column_header": true, "row_header": false, "row_section": false }, { "bbox": { "l": 396.3, "t": 341.7, "r": 417.1, "b": 349.8, "coord_origin": "TOPLEFT" }, "row_span": 1, "col_span": 1, "start_row_offset_idx": 0, "end_row_offset_idx": 1, "start_col_offset_idx": 6, "end_col_offset_idx": 7, "text": "mAP", "column_header": true, "row_header": false, "row_section": false }, { "bbox": { "l": 394.9, "t": 352.7, "r": 418.5, "b": 360.8, "coord_origin": "TOPLEFT" }, "row_span": 1, "col_span": 1, "start_row_offset_idx": 1, "end_row_offset_idx": 2, "start_col_offset_idx": 6, "end_col_offset_idx": 7, "text": "(0.75)", "column_header": true, "row_header": false, "row_section": false }, { "bbox": { "l": 430.8, "t": 341.7, "r": 467.1, "b": 349.8, "coord_origin": "TOPLEFT" }, "row_span": 1, "col_span": 1, "start_row_offset_idx": 0, "end_row_offset_idx": 1, "start_col_offset_idx": 7, "end_col_offset_idx": 8, "text": "Inference", "column_header": true, "row_header": false, "row_section": false }, { "bbox": { "l": 427.1, "t": 352.7, "r": 470.8, "b": 360.8, "coord_origin": "TOPLEFT" }, "row_span": 1, "col_span": 1, "start_row_offset_idx": 1, "end_row_offset_idx": 2, "start_col_offset_idx": 7, "end_col_offset_idx": 8, "text": "time (secs)", "column_header": true, "row_header": false, "row_section": false }, { "bbox": { "l": 286.7, "t": 354.7, "r": 312.3, "b": 362.8, "coord_origin": "TOPLEFT" }, "row_span": 1, "col_span": 1, "start_row_offset_idx": 1, "end_row_offset_idx": 2, "start_col_offset_idx": 3, "end_col_offset_idx": 4, "text": "simple", "column_header": true, "row_header": false, "row_section": false }, { "bbox": { "l": 320.7, "t": 354.7, "r": 353.7, "b": 362.8, "coord_origin": "TOPLEFT" }, "row_span": 1, "col_span": 1, "start_row_offset_idx": 1, "end_row_offset_idx": 2, "start_col_offset_idx": 4, "end_col_offset_idx": 5, "text": "complex", "column_header": true, "row_header": false, "row_section": false }, { "bbox": { "l": 369.3, "t": 354.7, "r": 379.0, "b": 362.8, "coord_origin": "TOPLEFT" }, "row_span": 1, "col_span": 1, "start_row_offset_idx": 1, "end_row_offset_idx": 2, "start_col_offset_idx": 5, "end_col_offset_idx": 6, "text": "all", "column_header": true, "row_header": false, "row_section": false }, { "bbox": { "l": 161.9, "t": 373.5, "r": 166.5, "b": 381.6, "coord_origin": "TOPLEFT" }, "row_span": 1, "col_span": 1, "start_row_offset_idx": 2, "end_row_offset_idx": 3, "start_col_offset_idx": 0, "end_col_offset_idx": 1, "text": "6", "column_header": false, "row_header": false, "row_section": false }, { "bbox": { "l": 209.5, "t": 373.5, "r": 214.1, "b": 381.6, "coord_origin": "TOPLEFT" }, "row_span": 1, "col_span": 1, "start_row_offset_idx": 2, "end_row_offset_idx": 3, "start_col_offset_idx": 1, "end_col_offset_idx": 2, "text": "6", "column_header": false, "row_header": false, "row_section": false }, { "bbox": { "l": 246.7, "t": 368.0, "r": 271.4, "b": 376.1, "coord_origin": "TOPLEFT" }, "row_span": 1, "col_span": 1, "start_row_offset_idx": 2, "end_row_offset_idx": 3, "start_col_offset_idx": 2, "end_col_offset_idx": 3, "text": "OTSL HTML", "column_header": false, "row_header": false, "row_section": false }, { "bbox": { "l": 289.0, "t": 368.0, "r": 310.0, "b": 376.1, "coord_origin": "TOPLEFT" }, "row_span": 1, "col_span": 1, "start_row_offset_idx": 2, "end_row_offset_idx": 3, "start_col_offset_idx": 3, "end_col_offset_idx": 4, "text": "0.965 0.969", "column_header": false, "row_header": false, "row_section": false }, { "bbox": { "l": 326.7, "t": 368.0, "r": 347.7, "b": 376.1, "coord_origin": "TOPLEFT" }, "row_span": 1, "col_span": 1, "start_row_offset_idx": 2, "end_row_offset_idx": 3, "start_col_offset_idx": 4, "end_col_offset_idx": 5, "text": "0.934 0.927", "column_header": false, "row_header": false, "row_section": false }, { "bbox": { "l": 363.7, "t": 368.0, "r": 384.7, "b": 376.1, "coord_origin": "TOPLEFT" }, "row_span": 1, "col_span": 1, "start_row_offset_idx": 2, "end_row_offset_idx": 3, "start_col_offset_idx": 5, "end_col_offset_idx": 6, "text": "0.955 0.955", "column_header": false, "row_header": false, "row_section": false }, { "bbox": { "l": 397.3, "t": 368.0, "r": 416.1, "b": 375.9, "coord_origin": "TOPLEFT" }, "row_span": 1, "col_span": 1, "start_row_offset_idx": 2, "end_row_offset_idx": 3, "start_col_offset_idx": 6, "end_col_offset_idx": 7, "text": "0.88 0.857", "column_header": false, "row_header": false, "row_section": false }, { "bbox": { "l": 439.5, "t": 368.0, "r": 458.4, "b": 375.9, "coord_origin": "TOPLEFT" }, "row_span": 1, "col_span": 1, "start_row_offset_idx": 2, "end_row_offset_idx": 3, "start_col_offset_idx": 7, "end_col_offset_idx": 8, "text": "2.73 5.39", "column_header": false, "row_header": false, "row_section": false }, { "bbox": { "l": 161.9, "t": 399.8, "r": 166.5, "b": 407.9, "coord_origin": "TOPLEFT" }, "row_span": 1, "col_span": 1, "start_row_offset_idx": 3, "end_row_offset_idx": 4, "start_col_offset_idx": 0, "end_col_offset_idx": 1, "text": "4", "column_header": false, "row_header": false, "row_section": false }, { "bbox": { "l": 209.5, "t": 399.8, "r": 214.1, "b": 407.9, "coord_origin": "TOPLEFT" }, "row_span": 1, "col_span": 1, "start_row_offset_idx": 3, "end_row_offset_idx": 4, "start_col_offset_idx": 1, "end_col_offset_idx": 2, "text": "4", "column_header": false, "row_header": false, "row_section": false }, { "bbox": { "l": 246.7, "t": 394.3, "r": 271.4, "b": 402.4, "coord_origin": "TOPLEFT" }, "row_span": 1, "col_span": 1, "start_row_offset_idx": 3, "end_row_offset_idx": 4, "start_col_offset_idx": 2, "end_col_offset_idx": 3, "text": "OTSL HTML", "column_header": false, "row_header": false, "row_section": false }, { "bbox": { "l": 289.0, "t": 394.3, "r": 310.0, "b": 402.4, "coord_origin": "TOPLEFT" }, "row_span": 1, "col_span": 1, "start_row_offset_idx": 3, "end_row_offset_idx": 4, "start_col_offset_idx": 3, "end_col_offset_idx": 4, "text": "0.938 0.952", "column_header": false, "row_header": false, "row_section": false }, { "bbox": { "l": 326.7, "t": 394.3, "r": 347.7, "b": 402.4, "coord_origin": "TOPLEFT" }, "row_span": 1, "col_span": 1, "start_row_offset_idx": 3, "end_row_offset_idx": 4, "start_col_offset_idx": 4, "end_col_offset_idx": 5, "text": "0.904 0.909", "column_header": false, "row_header": false, "row_section": false }, { "bbox": { "l": 363.7, "t": 394.3, "r": 384.7, "b": 402.4, "coord_origin": "TOPLEFT" }, "row_span": 1, "col_span": 1, "start_row_offset_idx": 3, "end_row_offset_idx": 4, "start_col_offset_idx": 5, "end_col_offset_idx": 6, "text": "0.927 0.938", "column_header": false, "row_header": false, "row_section": false }, { "bbox": { "l": 394.6, "t": 394.3, "r": 418.8, "b": 402.2, "coord_origin": "TOPLEFT" }, "row_span": 1, "col_span": 1, "start_row_offset_idx": 3, "end_row_offset_idx": 4, "start_col_offset_idx": 6, "end_col_offset_idx": 7, "text": "0.853 0.843", "column_header": false, "row_header": false, "row_section": false }, { "bbox": { "l": 439.5, "t": 394.3, "r": 458.4, "b": 402.2, "coord_origin": "TOPLEFT" }, "row_span": 1, "col_span": 1, "start_row_offset_idx": 3, "end_row_offset_idx": 4, "start_col_offset_idx": 7, "end_col_offset_idx": 8, "text": "1.97 3.77", "column_header": false, "row_header": false, "row_section": false }, { "bbox": { "l": 161.9, "t": 426.1, "r": 166.5, "b": 434.2, "coord_origin": "TOPLEFT" }, "row_span": 1, "col_span": 1, "start_row_offset_idx": 4, "end_row_offset_idx": 5, "start_col_offset_idx": 0, "end_col_offset_idx": 1, "text": "2", "column_header": false, "row_header": false, "row_section": false }, { "bbox": { "l": 209.5, "t": 426.1, "r": 214.1, "b": 434.2, "coord_origin": "TOPLEFT" }, "row_span": 1, "col_span": 1, "start_row_offset_idx": 4, "end_row_offset_idx": 5, "start_col_offset_idx": 1, "end_col_offset_idx": 2, "text": "4", "column_header": false, "row_header": false, "row_section": false }, { "bbox": { "l": 246.7, "t": 420.6, "r": 271.4, "b": 428.7, "coord_origin": "TOPLEFT" }, "row_span": 1, "col_span": 1, "start_row_offset_idx": 4, "end_row_offset_idx": 5, "start_col_offset_idx": 2, "end_col_offset_idx": 3, "text": "OTSL HTML", "column_header": false, "row_header": false, "row_section": false }, { "bbox": { "l": 289.0, "t": 420.6, "r": 310.0, "b": 428.7, "coord_origin": "TOPLEFT" }, "row_span": 1, "col_span": 1, "start_row_offset_idx": 4, "end_row_offset_idx": 5, "start_col_offset_idx": 3, "end_col_offset_idx": 4, "text": "0.923 0.945", "column_header": false, "row_header": false, "row_section": false }, { "bbox": { "l": 326.7, "t": 420.6, "r": 347.7, "b": 428.7, "coord_origin": "TOPLEFT" }, "row_span": 1, "col_span": 1, "start_row_offset_idx": 4, "end_row_offset_idx": 5, "start_col_offset_idx": 4, "end_col_offset_idx": 5, "text": "0.897 0.901", "column_header": false, "row_header": false, "row_section": false }, { "bbox": { "l": 363.7, "t": 420.6, "r": 384.7, "b": 428.7, "coord_origin": "TOPLEFT" }, "row_span": 1, "col_span": 1, "start_row_offset_idx": 4, "end_row_offset_idx": 5, "start_col_offset_idx": 5, "end_col_offset_idx": 6, "text": "0.915 0.931", "column_header": false, "row_header": false, "row_section": false }, { "bbox": { "l": 394.6, "t": 420.6, "r": 418.8, "b": 428.5, "coord_origin": "TOPLEFT" }, "row_span": 1, "col_span": 1, "start_row_offset_idx": 4, "end_row_offset_idx": 5, "start_col_offset_idx": 6, "end_col_offset_idx": 7, "text": "0.859 0.834", "column_header": false, "row_header": false, "row_section": false }, { "bbox": { "l": 439.5, "t": 420.6, "r": 458.4, "b": 428.5, "coord_origin": "TOPLEFT" }, "row_span": 1, "col_span": 1, "start_row_offset_idx": 4, "end_row_offset_idx": 5, "start_col_offset_idx": 7, "end_col_offset_idx": 8, "text": "1.91 3.81", "column_header": false, "row_header": false, "row_section": false }, { "bbox": { "l": 161.9, "t": 452.4, "r": 166.5, "b": 460.5, "coord_origin": "TOPLEFT" }, "row_span": 1, "col_span": 1, "start_row_offset_idx": 5, "end_row_offset_idx": 6, "start_col_offset_idx": 0, "end_col_offset_idx": 1, "text": "4", "column_header": false, "row_header": false, "row_section": false }, { "bbox": { "l": 209.5, "t": 452.4, "r": 214.1, "b": 460.5, "coord_origin": "TOPLEFT" }, "row_span": 1, "col_span": 1, "start_row_offset_idx": 5, "end_row_offset_idx": 6, "start_col_offset_idx": 1, "end_col_offset_idx": 2, "text": "2", "column_header": false, "row_header": false, "row_section": false }, { "bbox": { "l": 246.7, "t": 446.9, "r": 271.4, "b": 455.0, "coord_origin": "TOPLEFT" }, "row_span": 1, "col_span": 1, "start_row_offset_idx": 5, "end_row_offset_idx": 6, "start_col_offset_idx": 2, "end_col_offset_idx": 3, "text": "OTSL HTML", "column_header": false, "row_header": false, "row_section": false }, { "bbox": { "l": 289.0, "t": 446.9, "r": 310.0, "b": 455.0, "coord_origin": "TOPLEFT" }, "row_span": 1, "col_span": 1, "start_row_offset_idx": 5, "end_row_offset_idx": 6, "start_col_offset_idx": 3, "end_col_offset_idx": 4, "text": "0.952 0.944", "column_header": false, "row_header": false, "row_section": false }, { "bbox": { "l": 329.0, "t": 446.9, "r": 345.4, "b": 455.0, "coord_origin": "TOPLEFT" }, "row_span": 1, "col_span": 1, "start_row_offset_idx": 5, "end_row_offset_idx": 6, "start_col_offset_idx": 4, "end_col_offset_idx": 5, "text": "0.92 0.903", "column_header": false, "row_header": false, "row_section": false }, { "bbox": { "l": 362.1, "t": 446.9, "r": 386.2, "b": 454.8, "coord_origin": "TOPLEFT" }, "row_span": 1, "col_span": 1, "start_row_offset_idx": 5, "end_row_offset_idx": 6, "start_col_offset_idx": 5, "end_col_offset_idx": 6, "text": "0.942 0.931", "column_header": false, "row_header": false, "row_section": false }, { "bbox": { "l": 394.6, "t": 446.9, "r": 418.8, "b": 454.8, "coord_origin": "TOPLEFT" }, "row_span": 1, "col_span": 1, "start_row_offset_idx": 5, "end_row_offset_idx": 6, "start_col_offset_idx": 6, "end_col_offset_idx": 7, "text": "0.857 0.824", "column_header": false, "row_header": false, "row_section": false }, { "bbox": { "l": 439.5, "t": 446.9, "r": 458.4, "b": 454.8, "coord_origin": "TOPLEFT" }, "row_span": 1, "col_span": 1, "start_row_offset_idx": 5, "end_row_offset_idx": 6, "start_col_offset_idx": 7, "end_col_offset_idx": 8, "text": "1.22 2", "column_header": false, "row_header": false, "row_section": false } ] }, { "label": "section_header", "id": 5, "page_no": 8, "cluster": { "id": 5, "label": "section_header", "bbox": { "l": 134.8, "t": 508.2, "r": 264.4, "b": 517.0, "coord_origin": "TOPLEFT" }, "confidence": 0.96, "cells": [ { "index": 91, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 134.8, "r_y0": 517.0, "r_x1": 149.4, "r_y1": 517.0, "r_x2": 149.4, "r_y2": 508.2, "r_x3": 134.8, "r_y3": 508.2, "coord_origin": "TOPLEFT" }, "text": "5.2", "orig": "5.2", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 92, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 160.9, "r_y0": 517.0, "r_x1": 264.4, "r_y1": 517.0, "r_x2": 264.4, "r_y2": 508.2, "r_x3": 160.9, "r_y3": 508.2, "coord_origin": "TOPLEFT" }, "text": "Quantitative Results", "orig": "Quantitative Results", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, "text": "5.2 Quantitative Results" }, { "label": "text", "id": 1, "page_no": 8, "cluster": { "id": 1, "label": "text", "bbox": { "l": 134.8, "t": 524.6, "r": 480.6, "b": 617.0, "coord_origin": "TOPLEFT" }, "confidence": 0.99, "cells": [ { "index": 93, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 134.8, "r_y0": 533.3, "r_x1": 480.6, "r_y1": 533.3, "r_x2": 480.6, "r_y2": 524.6, "r_x3": 134.8, "r_y3": 524.6, "coord_origin": "TOPLEFT" }, "text": "We picked the model parameter configuration that produced the best prediction", "orig": "We picked the model parameter configuration that produced the best prediction", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 94, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 134.8, "r_y0": 545.3, "r_x1": 480.6, "r_y1": 545.3, "r_x2": 480.6, "r_y2": 536.5, "r_x3": 134.8, "r_y3": 536.5, "coord_origin": "TOPLEFT" }, "text": "quality (enc=6, dec=6, heads=8) with PubTabNet alone, then independently", "orig": "quality (enc=6, dec=6, heads=8) with PubTabNet alone, then independently", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 95, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 134.8, "r_y0": 557.3, "r_x1": 480.6, "r_y1": 557.3, "r_x2": 480.6, "r_y2": 548.5, "r_x3": 134.8, "r_y3": 548.5, "coord_origin": "TOPLEFT" }, "text": "trained and evaluated it on three publicly available data sets: PubTabNet (395k", "orig": "trained and evaluated it on three publicly available data sets: PubTabNet (395k", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 96, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 134.8, "r_y0": 569.2, "r_x1": 480.6, "r_y1": 569.2, "r_x2": 480.6, "r_y2": 560.4, "r_x3": 134.8, "r_y3": 560.4, "coord_origin": "TOPLEFT" }, "text": "samples), FinTabNet (113k samples) and PubTables-1M (about 1M samples).", "orig": "samples), FinTabNet (113k samples) and PubTables-1M (about 1M samples).", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 97, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 134.8, "r_y0": 581.2, "r_x1": 480.6, "r_y1": 581.2, "r_x2": 480.6, "r_y2": 572.4, "r_x3": 134.8, "r_y3": 572.4, "coord_origin": "TOPLEFT" }, "text": "Performance results are presented in Table. 2. It is clearly evident that the model", "orig": "Performance results are presented in Table. 2. It is clearly evident that the model", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 98, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 134.8, "r_y0": 593.1, "r_x1": 480.6, "r_y1": 593.1, "r_x2": 480.6, "r_y2": 584.3, "r_x3": 134.8, "r_y3": 584.3, "coord_origin": "TOPLEFT" }, "text": "trained on OTSL outperforms HTML across the board, keeping high TEDs and", "orig": "trained on OTSL outperforms HTML across the board, keeping high TEDs and", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 99, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 134.8, "r_y0": 605.1, "r_x1": 480.6, "r_y1": 605.1, "r_x2": 480.6, "r_y2": 596.3, "r_x3": 134.8, "r_y3": 596.3, "coord_origin": "TOPLEFT" }, "text": "mAP scores even on difficult financial tables (FinTabNet) that contain sparse", "orig": "mAP scores even on difficult financial tables (FinTabNet) that contain sparse", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 100, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 134.8, "r_y0": 617.0, "r_x1": 206.8, "r_y1": 617.0, "r_x2": 206.8, "r_y2": 608.2, "r_x3": 134.8, "r_y3": 608.2, "coord_origin": "TOPLEFT" }, "text": "and large tables.", "orig": "and large tables.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, "text": "We picked the model parameter configuration that produced the best prediction quality (enc=6, dec=6, heads=8) with PubTabNet alone, then independently trained and evaluated it on three publicly available data sets: PubTabNet (395k samples), FinTabNet (113k samples) and PubTables-1M (about 1M samples). Performance results are presented in Table. 2. It is clearly evident that the model trained on OTSL outperforms HTML across the board, keeping high TEDs and mAP scores even on difficult financial tables (FinTabNet) that contain sparse and large tables." }, { "label": "text", "id": 2, "page_no": 8, "cluster": { "id": 2, "label": "text", "bbox": { "l": 134.8, "t": 620.2, "r": 480.6, "b": 664.9, "coord_origin": "TOPLEFT" }, "confidence": 0.99, "cells": [ { "index": 101, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 149.7, "r_y0": 629.0, "r_x1": 480.6, "r_y1": 629.0, "r_x2": 480.6, "r_y2": 620.2, "r_x3": 149.7, "r_y3": 620.2, "coord_origin": "TOPLEFT" }, "text": "Additionally, the results show that OTSL has an advantage over HTML", "orig": "Additionally, the results show that OTSL has an advantage over HTML", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 102, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 134.8, "r_y0": 640.9, "r_x1": 480.6, "r_y1": 640.9, "r_x2": 480.6, "r_y2": 632.1, "r_x3": 134.8, "r_y3": 632.1, "coord_origin": "TOPLEFT" }, "text": "when applied on a bigger data set like PubTables-1M and achieves significantly", "orig": "when applied on a bigger data set like PubTables-1M and achieves significantly", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 103, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 134.8, "r_y0": 652.9, "r_x1": 480.6, "r_y1": 652.9, "r_x2": 480.6, "r_y2": 644.1, "r_x3": 134.8, "r_y3": 644.1, "coord_origin": "TOPLEFT" }, "text": "improved scores. Finally, OTSL achieves faster inference due to fewer decoding", "orig": "improved scores. Finally, OTSL achieves faster inference due to fewer decoding", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 104, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 134.8, "r_y0": 664.9, "r_x1": 405.8, "r_y1": 664.9, "r_x2": 405.8, "r_y2": 656.1, "r_x3": 134.8, "r_y3": 656.1, "coord_origin": "TOPLEFT" }, "text": "steps which is a result of the reduced sequence representation.", "orig": "steps which is a result of the reduced sequence representation.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, "text": "Additionally, the results show that OTSL has an advantage over HTML when applied on a bigger data set like PubTables-1M and achieves significantly improved scores. Finally, OTSL achieves faster inference due to fewer decoding steps which is a result of the reduced sequence representation." } ], "body": [ { "label": "text", "id": 4, "page_no": 8, "cluster": { "id": 4, "label": "text", "bbox": { "l": 134.8, "t": 118.9, "r": 480.6, "b": 151.6, "coord_origin": "TOPLEFT" }, "confidence": 0.98, "cells": [ { "index": 2, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 134.8, "r_y0": 127.7, "r_x1": 480.6, "r_y1": 127.7, "r_x2": 480.6, "r_y2": 118.9, "r_x3": 134.8, "r_y3": 118.9, "coord_origin": "TOPLEFT" }, "text": "order to compute the TED score. Inference timing results for all experiments", "orig": "order to compute the TED score. Inference timing results for all experiments", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 3, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 134.8, "r_y0": 139.7, "r_x1": 480.6, "r_y1": 139.7, "r_x2": 480.6, "r_y2": 130.9, "r_x3": 134.8, "r_y3": 130.9, "coord_origin": "TOPLEFT" }, "text": "were obtained from the same machine on a single core with AMD EPYC 7763", "orig": "were obtained from the same machine on a single core with AMD EPYC 7763", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 4, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 134.8, "r_y0": 151.6, "r_x1": 210.8, "r_y1": 151.6, "r_x2": 210.8, "r_y2": 142.8, "r_x3": 134.8, "r_y3": 142.8, "coord_origin": "TOPLEFT" }, "text": "CPU @2.45 GHz.", "orig": "CPU @2.45 GHz.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, "text": "order to compute the TED score. Inference timing results for all experiments were obtained from the same machine on a single core with AMD EPYC 7763 CPU @2.45 GHz." }, { "label": "section_header", "id": 6, "page_no": 8, "cluster": { "id": 6, "label": "section_header", "bbox": { "l": 134.8, "t": 169.2, "r": 318.4, "b": 178.0, "coord_origin": "TOPLEFT" }, "confidence": 0.96, "cells": [ { "index": 5, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 134.8, "r_y0": 178.0, "r_x1": 149.4, "r_y1": 178.0, "r_x2": 149.4, "r_y2": 169.2, "r_x3": 134.8, "r_y3": 169.2, "coord_origin": "TOPLEFT" }, "text": "5.1", "orig": "5.1", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 6, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 160.9, "r_y0": 178.0, "r_x1": 318.4, "r_y1": 178.0, "r_x2": 318.4, "r_y2": 169.2, "r_x3": 160.9, "r_y3": 169.2, "coord_origin": "TOPLEFT" }, "text": "Hyper Parameter Optimization", "orig": "Hyper Parameter Optimization", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, "text": "5.1 Hyper Parameter Optimization" }, { "label": "text", "id": 3, "page_no": 8, "cluster": { "id": 3, "label": "text", "bbox": { "l": 134.8, "t": 185.6, "r": 480.6, "b": 254.2, "coord_origin": "TOPLEFT" }, "confidence": 0.98, "cells": [ { "index": 7, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 134.8, "r_y0": 194.4, "r_x1": 480.6, "r_y1": 194.4, "r_x2": 480.6, "r_y2": 185.6, "r_x3": 134.8, "r_y3": 185.6, "coord_origin": "TOPLEFT" }, "text": "We have chosen the PubTabNet data set to perform HPO, since it includes a", "orig": "We have chosen the PubTabNet data set to perform HPO, since it includes a", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 8, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 134.8, "r_y0": 206.3, "r_x1": 480.6, "r_y1": 206.3, "r_x2": 480.6, "r_y2": 197.5, "r_x3": 134.8, "r_y3": 197.5, "coord_origin": "TOPLEFT" }, "text": "highly diverse set of tables. Also we report TED scores separately for simple and", "orig": "highly diverse set of tables. Also we report TED scores separately for simple and", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 9, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 134.8, "r_y0": 218.3, "r_x1": 480.6, "r_y1": 218.3, "r_x2": 480.6, "r_y2": 209.5, "r_x3": 134.8, "r_y3": 209.5, "coord_origin": "TOPLEFT" }, "text": "complex tables (tables with cell spans). Results are presented in Table. 1. It is", "orig": "complex tables (tables with cell spans). Results are presented in Table. 1. It is", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 10, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 134.8, "r_y0": 230.2, "r_x1": 480.6, "r_y1": 230.2, "r_x2": 480.6, "r_y2": 221.5, "r_x3": 134.8, "r_y3": 221.5, "coord_origin": "TOPLEFT" }, "text": "evident that with OTSL, our model achieves the same TED score and slightly", "orig": "evident that with OTSL, our model achieves the same TED score and slightly", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 11, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 134.8, "r_y0": 242.2, "r_x1": 440.9, "r_y1": 242.2, "r_x2": 440.9, "r_y2": 233.4, "r_x3": 134.8, "r_y3": 233.4, "coord_origin": "TOPLEFT" }, "text": "better mAP scores in comparison to HTML. However OTSL yields a", "orig": "better mAP scores in comparison to HTML. However OTSL yields a", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 12, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 444.9, "r_y0": 242.2, "r_x1": 480.6, "r_y1": 242.2, "r_x2": 480.6, "r_y2": 233.4, "r_x3": 444.9, "r_y3": 233.4, "coord_origin": "TOPLEFT" }, "text": "2x speed", "orig": "2x speed", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 13, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 134.8, "r_y0": 254.2, "r_x1": 145.2, "r_y1": 254.2, "r_x2": 145.2, "r_y2": 245.4, "r_x3": 134.8, "r_y3": 245.4, "coord_origin": "TOPLEFT" }, "text": "up", "orig": "up", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 14, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 149.1, "r_y0": 254.2, "r_x1": 311.2, "r_y1": 254.2, "r_x2": 311.2, "r_y2": 245.4, "r_x3": 149.1, "r_y3": 245.4, "coord_origin": "TOPLEFT" }, "text": "in the inference runtime over HTML.", "orig": "in the inference runtime over HTML.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, "text": "We have chosen the PubTabNet data set to perform HPO, since it includes a highly diverse set of tables. Also we report TED scores separately for simple and complex tables (tables with cell spans). Results are presented in Table. 1. It is evident that with OTSL, our model achieves the same TED score and slightly better mAP scores in comparison to HTML. However OTSL yields a 2x speed up in the inference runtime over HTML." }, { "label": "caption", "id": 7, "page_no": 8, "cluster": { "id": 7, "label": "caption", "bbox": { "l": 134.8, "t": 275.1, "r": 480.6, "b": 327.0, "coord_origin": "TOPLEFT" }, "confidence": 0.96, "cells": [ { "index": 15, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 134.8, "r_y0": 283.0, "r_x1": 160.1, "r_y1": 283.0, "r_x2": 160.1, "r_y2": 275.1, "r_x3": 134.8, "r_y3": 275.1, "coord_origin": "TOPLEFT" }, "text": "Table", "orig": "Table", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 16, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 167.3, "r_y0": 283.0, "r_x1": 175.6, "r_y1": 283.0, "r_x2": 175.6, "r_y2": 275.1, "r_x3": 167.3, "r_y3": 275.1, "coord_origin": "TOPLEFT" }, "text": "1.", "orig": "1.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 17, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 188.1, "r_y0": 283.2, "r_x1": 480.6, "r_y1": 283.2, "r_x2": 480.6, "r_y2": 275.1, "r_x3": 188.1, "r_y3": 275.1, "coord_origin": "TOPLEFT" }, "text": "HPO performed in OTSL and HTML representation on the same", "orig": "HPO performed in OTSL and HTML representation on the same", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 18, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 134.8, "r_y0": 294.2, "r_x1": 480.6, "r_y1": 294.2, "r_x2": 480.6, "r_y2": 286.1, "r_x3": 134.8, "r_y3": 286.1, "coord_origin": "TOPLEFT" }, "text": "transformer-based TableFormer [9] architecture, trained only on PubTabNet [22]. Ef-", "orig": "transformer-based TableFormer [9] architecture, trained only on PubTabNet [22]. Ef-", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 19, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 134.8, "r_y0": 305.1, "r_x1": 480.6, "r_y1": 305.1, "r_x2": 480.6, "r_y2": 297.1, "r_x3": 134.8, "r_y3": 297.1, "coord_origin": "TOPLEFT" }, "text": "fects of reducing the # of layers in encoder and decoder stages of the model show that", "orig": "fects of reducing the # of layers in encoder and decoder stages of the model show that", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 20, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 134.8, "r_y0": 316.1, "r_x1": 480.6, "r_y1": 316.1, "r_x2": 480.6, "r_y2": 308.0, "r_x3": 134.8, "r_y3": 308.0, "coord_origin": "TOPLEFT" }, "text": "smaller models trained on OTSL perform better, especially in recognizing complex", "orig": "smaller models trained on OTSL perform better, especially in recognizing complex", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 21, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 134.8, "r_y0": 327.0, "r_x1": 480.6, "r_y1": 327.0, "r_x2": 480.6, "r_y2": 319.0, "r_x3": 134.8, "r_y3": 319.0, "coord_origin": "TOPLEFT" }, "text": "table structures, and maintain a much higher mAP score than the HTML counterpart.", "orig": "table structures, and maintain a much higher mAP score than the HTML counterpart.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, "text": "Table 1. HPO performed in OTSL and HTML representation on the same transformer-based TableFormer [9] architecture, trained only on PubTabNet [22]. Effects of reducing the # of layers in encoder and decoder stages of the model show that smaller models trained on OTSL perform better, especially in recognizing complex table structures, and maintain a much higher mAP score than the HTML counterpart." }, { "label": "table", "id": 0, "page_no": 8, "cluster": { "id": 0, "label": "table", "bbox": { "l": 139.7, "t": 337.6, "r": 475.0, "b": 469.5, "coord_origin": "TOPLEFT" }, "confidence": 0.99, "cells": [ { "index": 22, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 160.4, "r_y0": 349.8, "r_x1": 168.0, "r_y1": 349.8, "r_x2": 168.0, "r_y2": 341.7, "r_x3": 160.4, "r_y3": 341.7, "coord_origin": "TOPLEFT" }, "text": "#", "orig": "#", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 23, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 144.6, "r_y0": 362.8, "r_x1": 183.8, "r_y1": 362.8, "r_x2": 183.8, "r_y2": 354.7, "r_x3": 144.6, "r_y3": 354.7, "coord_origin": "TOPLEFT" }, "text": "enc-layers", "orig": "enc-layers", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 24, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 208.0, "r_y0": 349.8, "r_x1": 215.7, "r_y1": 349.8, "r_x2": 215.7, "r_y2": 341.7, "r_x3": 208.0, "r_y3": 341.7, "coord_origin": "TOPLEFT" }, "text": "#", "orig": "#", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 25, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 192.2, "r_y0": 362.8, "r_x1": 231.4, "r_y1": 362.8, "r_x2": 231.4, "r_y2": 354.7, "r_x3": 192.2, "r_y3": 354.7, "coord_origin": "TOPLEFT" }, "text": "dec-layers", "orig": "dec-layers", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 26, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 239.8, "r_y0": 355.3, "r_x1": 278.3, "r_y1": 355.3, "r_x2": 278.3, "r_y2": 347.2, "r_x3": 239.8, "r_y3": 347.2, "coord_origin": "TOPLEFT" }, "text": "Language", "orig": "Language", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 27, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 324.7, "r_y0": 349.8, "r_x1": 348.3, "r_y1": 349.8, "r_x2": 348.3, "r_y2": 341.7, "r_x3": 324.7, "r_y3": 341.7, "coord_origin": "TOPLEFT" }, "text": "TEDs", "orig": "TEDs", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 28, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 396.3, "r_y0": 349.8, "r_x1": 417.1, "r_y1": 349.8, "r_x2": 417.1, "r_y2": 341.7, "r_x3": 396.3, "r_y3": 341.7, "coord_origin": "TOPLEFT" }, "text": "mAP", "orig": "mAP", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 29, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 394.9, "r_y0": 360.8, "r_x1": 418.5, "r_y1": 360.8, "r_x2": 418.5, "r_y2": 352.7, "r_x3": 394.9, "r_y3": 352.7, "coord_origin": "TOPLEFT" }, "text": "(0.75)", "orig": "(0.75)", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 30, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 430.8, "r_y0": 349.8, "r_x1": 467.1, "r_y1": 349.8, "r_x2": 467.1, "r_y2": 341.7, "r_x3": 430.8, "r_y3": 341.7, "coord_origin": "TOPLEFT" }, "text": "Inference", "orig": "Inference", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 31, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 427.1, "r_y0": 360.8, "r_x1": 470.8, "r_y1": 360.8, "r_x2": 470.8, "r_y2": 352.7, "r_x3": 427.1, "r_y3": 352.7, "coord_origin": "TOPLEFT" }, "text": "time (secs)", "orig": "time (secs)", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 32, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 286.7, "r_y0": 362.8, "r_x1": 312.3, "r_y1": 362.8, "r_x2": 312.3, "r_y2": 354.7, "r_x3": 286.7, "r_y3": 354.7, "coord_origin": "TOPLEFT" }, "text": "simple", "orig": "simple", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 33, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 320.7, "r_y0": 362.8, "r_x1": 353.7, "r_y1": 362.8, "r_x2": 353.7, "r_y2": 354.7, "r_x3": 320.7, "r_y3": 354.7, "coord_origin": "TOPLEFT" }, "text": "complex", "orig": "complex", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 34, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 369.3, "r_y0": 362.8, "r_x1": 379.0, "r_y1": 362.8, "r_x2": 379.0, "r_y2": 354.7, "r_x3": 369.3, "r_y3": 354.7, "coord_origin": "TOPLEFT" }, "text": "all", "orig": "all", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 35, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 161.9, "r_y0": 381.6, "r_x1": 166.5, "r_y1": 381.6, "r_x2": 166.5, "r_y2": 373.5, "r_x3": 161.9, "r_y3": 373.5, "coord_origin": "TOPLEFT" }, "text": "6", "orig": "6", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 36, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 209.5, "r_y0": 381.6, "r_x1": 214.1, "r_y1": 381.6, "r_x2": 214.1, "r_y2": 373.5, "r_x3": 209.5, "r_y3": 373.5, "coord_origin": "TOPLEFT" }, "text": "6", "orig": "6", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 37, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 246.7, "r_y0": 376.1, "r_x1": 271.4, "r_y1": 376.1, "r_x2": 271.4, "r_y2": 368.0, "r_x3": 246.7, "r_y3": 368.0, "coord_origin": "TOPLEFT" }, "text": "OTSL", "orig": "OTSL", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 38, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 289.0, "r_y0": 376.1, "r_x1": 310.0, "r_y1": 376.1, "r_x2": 310.0, "r_y2": 368.0, "r_x3": 289.0, "r_y3": 368.0, "coord_origin": "TOPLEFT" }, "text": "0.965", "orig": "0.965", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 39, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 326.7, "r_y0": 376.1, "r_x1": 347.7, "r_y1": 376.1, "r_x2": 347.7, "r_y2": 368.0, "r_x3": 326.7, "r_y3": 368.0, "coord_origin": "TOPLEFT" }, "text": "0.934", "orig": "0.934", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 40, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 363.7, "r_y0": 376.1, "r_x1": 384.7, "r_y1": 376.1, "r_x2": 384.7, "r_y2": 368.0, "r_x3": 363.7, "r_y3": 368.0, "coord_origin": "TOPLEFT" }, "text": "0.955", "orig": "0.955", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 41, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 397.3, "r_y0": 375.9, "r_x1": 416.1, "r_y1": 375.9, "r_x2": 416.1, "r_y2": 368.0, "r_x3": 397.3, "r_y3": 368.0, "coord_origin": "TOPLEFT" }, "text": "0.88", "orig": "0.88", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 42, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 439.5, "r_y0": 375.9, "r_x1": 458.4, "r_y1": 375.9, "r_x2": 458.4, "r_y2": 368.0, "r_x3": 439.5, "r_y3": 368.0, "coord_origin": "TOPLEFT" }, "text": "2.73", "orig": "2.73", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 43, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 245.2, "r_y0": 389.1, "r_x1": 272.9, "r_y1": 389.1, "r_x2": 272.9, "r_y2": 381.0, "r_x3": 245.2, "r_y3": 381.0, "coord_origin": "TOPLEFT" }, "text": "HTML", "orig": "HTML", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 44, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 289.0, "r_y0": 389.1, "r_x1": 310.0, "r_y1": 389.1, "r_x2": 310.0, "r_y2": 381.0, "r_x3": 289.0, "r_y3": 381.0, "coord_origin": "TOPLEFT" }, "text": "0.969", "orig": "0.969", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 45, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 326.7, "r_y0": 389.1, "r_x1": 347.7, "r_y1": 389.1, "r_x2": 347.7, "r_y2": 381.0, "r_x3": 326.7, "r_y3": 381.0, "coord_origin": "TOPLEFT" }, "text": "0.927", "orig": "0.927", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 46, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 363.7, "r_y0": 389.1, "r_x1": 384.7, "r_y1": 389.1, "r_x2": 384.7, "r_y2": 381.0, "r_x3": 363.7, "r_y3": 381.0, "coord_origin": "TOPLEFT" }, "text": "0.955", "orig": "0.955", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 47, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 396.2, "r_y0": 389.1, "r_x1": 417.2, "r_y1": 389.1, "r_x2": 417.2, "r_y2": 381.0, "r_x3": 396.2, "r_y3": 381.0, "coord_origin": "TOPLEFT" }, "text": "0.857", "orig": "0.857", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 48, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 440.8, "r_y0": 389.1, "r_x1": 457.1, "r_y1": 389.1, "r_x2": 457.1, "r_y2": 381.0, "r_x3": 440.8, "r_y3": 381.0, "coord_origin": "TOPLEFT" }, "text": "5.39", "orig": "5.39", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 49, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 161.9, "r_y0": 407.9, "r_x1": 166.5, "r_y1": 407.9, "r_x2": 166.5, "r_y2": 399.8, "r_x3": 161.9, "r_y3": 399.8, "coord_origin": "TOPLEFT" }, "text": "4", "orig": "4", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 50, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 209.5, "r_y0": 407.9, "r_x1": 214.1, "r_y1": 407.9, "r_x2": 214.1, "r_y2": 399.8, "r_x3": 209.5, "r_y3": 399.8, "coord_origin": "TOPLEFT" }, "text": "4", "orig": "4", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 51, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 246.7, "r_y0": 402.4, "r_x1": 271.4, "r_y1": 402.4, "r_x2": 271.4, "r_y2": 394.3, "r_x3": 246.7, "r_y3": 394.3, "coord_origin": "TOPLEFT" }, "text": "OTSL", "orig": "OTSL", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 52, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 289.0, "r_y0": 402.4, "r_x1": 310.0, "r_y1": 402.4, "r_x2": 310.0, "r_y2": 394.3, "r_x3": 289.0, "r_y3": 394.3, "coord_origin": "TOPLEFT" }, "text": "0.938", "orig": "0.938", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 53, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 326.7, "r_y0": 402.4, "r_x1": 347.7, "r_y1": 402.4, "r_x2": 347.7, "r_y2": 394.3, "r_x3": 326.7, "r_y3": 394.3, "coord_origin": "TOPLEFT" }, "text": "0.904", "orig": "0.904", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 54, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 363.7, "r_y0": 402.4, "r_x1": 384.7, "r_y1": 402.4, "r_x2": 384.7, "r_y2": 394.3, "r_x3": 363.7, "r_y3": 394.3, "coord_origin": "TOPLEFT" }, "text": "0.927", "orig": "0.927", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 55, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 394.6, "r_y0": 402.2, "r_x1": 418.8, "r_y1": 402.2, "r_x2": 418.8, "r_y2": 394.3, "r_x3": 394.6, "r_y3": 394.3, "coord_origin": "TOPLEFT" }, "text": "0.853", "orig": "0.853", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 56, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 439.5, "r_y0": 402.2, "r_x1": 458.4, "r_y1": 402.2, "r_x2": 458.4, "r_y2": 394.3, "r_x3": 439.5, "r_y3": 394.3, "coord_origin": "TOPLEFT" }, "text": "1.97", "orig": "1.97", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 57, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 245.2, "r_y0": 415.4, "r_x1": 272.9, "r_y1": 415.4, "r_x2": 272.9, "r_y2": 407.3, "r_x3": 245.2, "r_y3": 407.3, "coord_origin": "TOPLEFT" }, "text": "HTML", "orig": "HTML", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 58, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 289.0, "r_y0": 415.4, "r_x1": 310.0, "r_y1": 415.4, "r_x2": 310.0, "r_y2": 407.3, "r_x3": 289.0, "r_y3": 407.3, "coord_origin": "TOPLEFT" }, "text": "0.952", "orig": "0.952", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 59, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 326.7, "r_y0": 415.4, "r_x1": 347.7, "r_y1": 415.4, "r_x2": 347.7, "r_y2": 407.3, "r_x3": 326.7, "r_y3": 407.3, "coord_origin": "TOPLEFT" }, "text": "0.909", "orig": "0.909", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 60, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 362.1, "r_y0": 415.2, "r_x1": 386.2, "r_y1": 415.2, "r_x2": 386.2, "r_y2": 407.2, "r_x3": 362.1, "r_y3": 407.2, "coord_origin": "TOPLEFT" }, "text": "0.938", "orig": "0.938", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 61, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 396.2, "r_y0": 415.4, "r_x1": 417.2, "r_y1": 415.4, "r_x2": 417.2, "r_y2": 407.3, "r_x3": 396.2, "r_y3": 407.3, "coord_origin": "TOPLEFT" }, "text": "0.843", "orig": "0.843", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 62, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 440.8, "r_y0": 415.4, "r_x1": 457.1, "r_y1": 415.4, "r_x2": 457.1, "r_y2": 407.3, "r_x3": 440.8, "r_y3": 407.3, "coord_origin": "TOPLEFT" }, "text": "3.77", "orig": "3.77", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 63, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 161.9, "r_y0": 434.2, "r_x1": 166.5, "r_y1": 434.2, "r_x2": 166.5, "r_y2": 426.1, "r_x3": 161.9, "r_y3": 426.1, "coord_origin": "TOPLEFT" }, "text": "2", "orig": "2", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 64, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 209.5, "r_y0": 434.2, "r_x1": 214.1, "r_y1": 434.2, "r_x2": 214.1, "r_y2": 426.1, "r_x3": 209.5, "r_y3": 426.1, "coord_origin": "TOPLEFT" }, "text": "4", "orig": "4", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 65, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 246.7, "r_y0": 428.7, "r_x1": 271.4, "r_y1": 428.7, "r_x2": 271.4, "r_y2": 420.6, "r_x3": 246.7, "r_y3": 420.6, "coord_origin": "TOPLEFT" }, "text": "OTSL", "orig": "OTSL", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 66, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 289.0, "r_y0": 428.7, "r_x1": 310.0, "r_y1": 428.7, "r_x2": 310.0, "r_y2": 420.6, "r_x3": 289.0, "r_y3": 420.6, "coord_origin": "TOPLEFT" }, "text": "0.923", "orig": "0.923", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 67, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 326.7, "r_y0": 428.7, "r_x1": 347.7, "r_y1": 428.7, "r_x2": 347.7, "r_y2": 420.6, "r_x3": 326.7, "r_y3": 420.6, "coord_origin": "TOPLEFT" }, "text": "0.897", "orig": "0.897", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 68, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 363.7, "r_y0": 428.7, "r_x1": 384.7, "r_y1": 428.7, "r_x2": 384.7, "r_y2": 420.6, "r_x3": 363.7, "r_y3": 420.6, "coord_origin": "TOPLEFT" }, "text": "0.915", "orig": "0.915", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 69, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 394.6, "r_y0": 428.5, "r_x1": 418.8, "r_y1": 428.5, "r_x2": 418.8, "r_y2": 420.6, "r_x3": 394.6, "r_y3": 420.6, "coord_origin": "TOPLEFT" }, "text": "0.859", "orig": "0.859", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 70, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 439.5, "r_y0": 428.5, "r_x1": 458.4, "r_y1": 428.5, "r_x2": 458.4, "r_y2": 420.6, "r_x3": 439.5, "r_y3": 420.6, "coord_origin": "TOPLEFT" }, "text": "1.91", "orig": "1.91", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 71, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 245.2, "r_y0": 441.7, "r_x1": 272.9, "r_y1": 441.7, "r_x2": 272.9, "r_y2": 433.6, "r_x3": 245.2, "r_y3": 433.6, "coord_origin": "TOPLEFT" }, "text": "HTML", "orig": "HTML", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 72, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 289.0, "r_y0": 441.7, "r_x1": 310.0, "r_y1": 441.7, "r_x2": 310.0, "r_y2": 433.6, "r_x3": 289.0, "r_y3": 433.6, "coord_origin": "TOPLEFT" }, "text": "0.945", "orig": "0.945", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 73, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 326.7, "r_y0": 441.7, "r_x1": 347.7, "r_y1": 441.7, "r_x2": 347.7, "r_y2": 433.6, "r_x3": 326.7, "r_y3": 433.6, "coord_origin": "TOPLEFT" }, "text": "0.901", "orig": "0.901", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 74, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 362.1, "r_y0": 441.5, "r_x1": 386.2, "r_y1": 441.5, "r_x2": 386.2, "r_y2": 433.5, "r_x3": 362.1, "r_y3": 433.5, "coord_origin": "TOPLEFT" }, "text": "0.931", "orig": "0.931", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 75, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 396.2, "r_y0": 441.7, "r_x1": 417.2, "r_y1": 441.7, "r_x2": 417.2, "r_y2": 433.6, "r_x3": 396.2, "r_y3": 433.6, "coord_origin": "TOPLEFT" }, "text": "0.834", "orig": "0.834", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 76, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 440.8, "r_y0": 441.7, "r_x1": 457.1, "r_y1": 441.7, "r_x2": 457.1, "r_y2": 433.6, "r_x3": 440.8, "r_y3": 433.6, "coord_origin": "TOPLEFT" }, "text": "3.81", "orig": "3.81", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 77, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 161.9, "r_y0": 460.5, "r_x1": 166.5, "r_y1": 460.5, "r_x2": 166.5, "r_y2": 452.4, "r_x3": 161.9, "r_y3": 452.4, "coord_origin": "TOPLEFT" }, "text": "4", "orig": "4", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 78, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 209.5, "r_y0": 460.5, "r_x1": 214.1, "r_y1": 460.5, "r_x2": 214.1, "r_y2": 452.4, "r_x3": 209.5, "r_y3": 452.4, "coord_origin": "TOPLEFT" }, "text": "2", "orig": "2", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 79, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 246.7, "r_y0": 455.0, "r_x1": 271.4, "r_y1": 455.0, "r_x2": 271.4, "r_y2": 446.9, "r_x3": 246.7, "r_y3": 446.9, "coord_origin": "TOPLEFT" }, "text": "OTSL", "orig": "OTSL", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 80, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 289.0, "r_y0": 455.0, "r_x1": 310.0, "r_y1": 455.0, "r_x2": 310.0, "r_y2": 446.9, "r_x3": 289.0, "r_y3": 446.9, "coord_origin": "TOPLEFT" }, "text": "0.952", "orig": "0.952", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 81, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 329.0, "r_y0": 455.0, "r_x1": 345.4, "r_y1": 455.0, "r_x2": 345.4, "r_y2": 446.9, "r_x3": 329.0, "r_y3": 446.9, "coord_origin": "TOPLEFT" }, "text": "0.92", "orig": "0.92", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 82, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 362.1, "r_y0": 454.8, "r_x1": 386.2, "r_y1": 454.8, "r_x2": 386.2, "r_y2": 446.9, "r_x3": 362.1, "r_y3": 446.9, "coord_origin": "TOPLEFT" }, "text": "0.942", "orig": "0.942", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 83, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 394.6, "r_y0": 454.8, "r_x1": 418.8, "r_y1": 454.8, "r_x2": 418.8, "r_y2": 446.9, "r_x3": 394.6, "r_y3": 446.9, "coord_origin": "TOPLEFT" }, "text": "0.857", "orig": "0.857", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 84, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 439.5, "r_y0": 454.8, "r_x1": 458.4, "r_y1": 454.8, "r_x2": 458.4, "r_y2": 446.9, "r_x3": 439.5, "r_y3": 446.9, "coord_origin": "TOPLEFT" }, "text": "1.22", "orig": "1.22", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 85, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 245.2, "r_y0": 468.0, "r_x1": 272.9, "r_y1": 468.0, "r_x2": 272.9, "r_y2": 459.9, "r_x3": 245.2, "r_y3": 459.9, "coord_origin": "TOPLEFT" }, "text": "HTML", "orig": "HTML", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 86, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 289.0, "r_y0": 468.0, "r_x1": 310.0, "r_y1": 468.0, "r_x2": 310.0, "r_y2": 459.9, "r_x3": 289.0, "r_y3": 459.9, "coord_origin": "TOPLEFT" }, "text": "0.944", "orig": "0.944", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 87, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 326.7, "r_y0": 468.0, "r_x1": 347.7, "r_y1": 468.0, "r_x2": 347.7, "r_y2": 459.9, "r_x3": 326.7, "r_y3": 459.9, "coord_origin": "TOPLEFT" }, "text": "0.903", "orig": "0.903", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 88, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 363.7, "r_y0": 468.0, "r_x1": 384.7, "r_y1": 468.0, "r_x2": 384.7, "r_y2": 459.9, "r_x3": 363.7, "r_y3": 459.9, "coord_origin": "TOPLEFT" }, "text": "0.931", "orig": "0.931", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 89, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 396.2, "r_y0": 468.0, "r_x1": 417.2, "r_y1": 468.0, "r_x2": 417.2, "r_y2": 459.9, "r_x3": 396.2, "r_y3": 459.9, "coord_origin": "TOPLEFT" }, "text": "0.824", "orig": "0.824", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 90, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 446.7, "r_y0": 468.0, "r_x1": 451.3, "r_y1": 468.0, "r_x2": 451.3, "r_y2": 459.9, "r_x3": 446.7, "r_y3": 459.9, "coord_origin": "TOPLEFT" }, "text": "2", "orig": "2", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [ { "id": 11, "label": "text", "bbox": { "l": 160.4, "t": 341.7, "r": 168.0, "b": 349.8, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 22, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 160.4, "r_y0": 349.8, "r_x1": 168.0, "r_y1": 349.8, "r_x2": 168.0, "r_y2": 341.7, "r_x3": 160.4, "r_y3": 341.7, "coord_origin": "TOPLEFT" }, "text": "#", "orig": "#", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 12, "label": "text", "bbox": { "l": 144.6, "t": 354.7, "r": 183.8, "b": 362.8, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 23, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 144.6, "r_y0": 362.8, "r_x1": 183.8, "r_y1": 362.8, "r_x2": 183.8, "r_y2": 354.7, "r_x3": 144.6, "r_y3": 354.7, "coord_origin": "TOPLEFT" }, "text": "enc-layers", "orig": "enc-layers", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 13, "label": "text", "bbox": { "l": 208.0, "t": 341.7, "r": 215.7, "b": 349.8, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 24, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 208.0, "r_y0": 349.8, "r_x1": 215.7, "r_y1": 349.8, "r_x2": 215.7, "r_y2": 341.7, "r_x3": 208.0, "r_y3": 341.7, "coord_origin": "TOPLEFT" }, "text": "#", "orig": "#", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 14, "label": "text", "bbox": { "l": 192.2, "t": 354.7, "r": 231.4, "b": 362.8, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 25, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 192.2, "r_y0": 362.8, "r_x1": 231.4, "r_y1": 362.8, "r_x2": 231.4, "r_y2": 354.7, "r_x3": 192.2, "r_y3": 354.7, "coord_origin": "TOPLEFT" }, "text": "dec-layers", "orig": "dec-layers", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 15, "label": "text", "bbox": { "l": 239.8, "t": 347.2, "r": 278.3, "b": 355.3, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 26, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 239.8, "r_y0": 355.3, "r_x1": 278.3, "r_y1": 355.3, "r_x2": 278.3, "r_y2": 347.2, "r_x3": 239.8, "r_y3": 347.2, "coord_origin": "TOPLEFT" }, "text": "Language", "orig": "Language", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 16, "label": "text", "bbox": { "l": 324.7, "t": 341.7, "r": 348.3, "b": 349.8, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 27, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 324.7, "r_y0": 349.8, "r_x1": 348.3, "r_y1": 349.8, "r_x2": 348.3, "r_y2": 341.7, "r_x3": 324.7, "r_y3": 341.7, "coord_origin": "TOPLEFT" }, "text": "TEDs", "orig": "TEDs", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 17, "label": "text", "bbox": { "l": 396.3, "t": 341.7, "r": 417.1, "b": 349.8, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 28, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 396.3, "r_y0": 349.8, "r_x1": 417.1, "r_y1": 349.8, "r_x2": 417.1, "r_y2": 341.7, "r_x3": 396.3, "r_y3": 341.7, "coord_origin": "TOPLEFT" }, "text": "mAP", "orig": "mAP", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 18, "label": "text", "bbox": { "l": 394.9, "t": 352.7, "r": 418.5, "b": 360.8, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 29, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 394.9, "r_y0": 360.8, "r_x1": 418.5, "r_y1": 360.8, "r_x2": 418.5, "r_y2": 352.7, "r_x3": 394.9, "r_y3": 352.7, "coord_origin": "TOPLEFT" }, "text": "(0.75)", "orig": "(0.75)", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 19, "label": "text", "bbox": { "l": 430.8, "t": 341.7, "r": 467.1, "b": 349.8, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 30, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 430.8, "r_y0": 349.8, "r_x1": 467.1, "r_y1": 349.8, "r_x2": 467.1, "r_y2": 341.7, "r_x3": 430.8, "r_y3": 341.7, "coord_origin": "TOPLEFT" }, "text": "Inference", "orig": "Inference", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 20, "label": "text", "bbox": { "l": 427.1, "t": 352.7, "r": 470.8, "b": 360.8, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 31, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 427.1, "r_y0": 360.8, "r_x1": 470.8, "r_y1": 360.8, "r_x2": 470.8, "r_y2": 352.7, "r_x3": 427.1, "r_y3": 352.7, "coord_origin": "TOPLEFT" }, "text": "time (secs)", "orig": "time (secs)", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 21, "label": "text", "bbox": { "l": 286.7, "t": 354.7, "r": 312.3, "b": 362.8, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 32, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 286.7, "r_y0": 362.8, "r_x1": 312.3, "r_y1": 362.8, "r_x2": 312.3, "r_y2": 354.7, "r_x3": 286.7, "r_y3": 354.7, "coord_origin": "TOPLEFT" }, "text": "simple", "orig": "simple", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 22, "label": "text", "bbox": { "l": 320.7, "t": 354.7, "r": 353.7, "b": 362.8, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 33, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 320.7, "r_y0": 362.8, "r_x1": 353.7, "r_y1": 362.8, "r_x2": 353.7, "r_y2": 354.7, "r_x3": 320.7, "r_y3": 354.7, "coord_origin": "TOPLEFT" }, "text": "complex", "orig": "complex", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 23, "label": "text", "bbox": { "l": 369.3, "t": 354.7, "r": 379.0, "b": 362.8, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 34, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 369.3, "r_y0": 362.8, "r_x1": 379.0, "r_y1": 362.8, "r_x2": 379.0, "r_y2": 354.7, "r_x3": 369.3, "r_y3": 354.7, "coord_origin": "TOPLEFT" }, "text": "all", "orig": "all", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 24, "label": "text", "bbox": { "l": 161.9, "t": 373.5, "r": 166.5, "b": 381.6, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 35, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 161.9, "r_y0": 381.6, "r_x1": 166.5, "r_y1": 381.6, "r_x2": 166.5, "r_y2": 373.5, "r_x3": 161.9, "r_y3": 373.5, "coord_origin": "TOPLEFT" }, "text": "6", "orig": "6", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 25, "label": "text", "bbox": { "l": 209.5, "t": 373.5, "r": 214.1, "b": 381.6, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 36, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 209.5, "r_y0": 381.6, "r_x1": 214.1, "r_y1": 381.6, "r_x2": 214.1, "r_y2": 373.5, "r_x3": 209.5, "r_y3": 373.5, "coord_origin": "TOPLEFT" }, "text": "6", "orig": "6", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 26, "label": "text", "bbox": { "l": 246.7, "t": 368.0, "r": 271.4, "b": 376.1, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 37, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 246.7, "r_y0": 376.1, "r_x1": 271.4, "r_y1": 376.1, "r_x2": 271.4, "r_y2": 368.0, "r_x3": 246.7, "r_y3": 368.0, "coord_origin": "TOPLEFT" }, "text": "OTSL", "orig": "OTSL", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 27, "label": "text", "bbox": { "l": 289.0, "t": 368.0, "r": 310.0, "b": 376.1, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 38, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 289.0, "r_y0": 376.1, "r_x1": 310.0, "r_y1": 376.1, "r_x2": 310.0, "r_y2": 368.0, "r_x3": 289.0, "r_y3": 368.0, "coord_origin": "TOPLEFT" }, "text": "0.965", "orig": "0.965", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 28, "label": "text", "bbox": { "l": 326.7, "t": 368.0, "r": 347.7, "b": 376.1, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 39, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 326.7, "r_y0": 376.1, "r_x1": 347.7, "r_y1": 376.1, "r_x2": 347.7, "r_y2": 368.0, "r_x3": 326.7, "r_y3": 368.0, "coord_origin": "TOPLEFT" }, "text": "0.934", "orig": "0.934", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 29, "label": "text", "bbox": { "l": 363.7, "t": 368.0, "r": 384.7, "b": 376.1, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 40, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 363.7, "r_y0": 376.1, "r_x1": 384.7, "r_y1": 376.1, "r_x2": 384.7, "r_y2": 368.0, "r_x3": 363.7, "r_y3": 368.0, "coord_origin": "TOPLEFT" }, "text": "0.955", "orig": "0.955", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 30, "label": "text", "bbox": { "l": 397.3, "t": 368.0, "r": 416.1, "b": 375.9, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 41, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 397.3, "r_y0": 375.9, "r_x1": 416.1, "r_y1": 375.9, "r_x2": 416.1, "r_y2": 368.0, "r_x3": 397.3, "r_y3": 368.0, "coord_origin": "TOPLEFT" }, "text": "0.88", "orig": "0.88", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 31, "label": "text", "bbox": { "l": 439.5, "t": 368.0, "r": 458.4, "b": 375.9, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 42, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 439.5, "r_y0": 375.9, "r_x1": 458.4, "r_y1": 375.9, "r_x2": 458.4, "r_y2": 368.0, "r_x3": 439.5, "r_y3": 368.0, "coord_origin": "TOPLEFT" }, "text": "2.73", "orig": "2.73", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 32, "label": "text", "bbox": { "l": 245.2, "t": 381.0, "r": 272.9, "b": 389.1, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 43, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 245.2, "r_y0": 389.1, "r_x1": 272.9, "r_y1": 389.1, "r_x2": 272.9, "r_y2": 381.0, "r_x3": 245.2, "r_y3": 381.0, "coord_origin": "TOPLEFT" }, "text": "HTML", "orig": "HTML", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 33, "label": "text", "bbox": { "l": 289.0, "t": 381.0, "r": 310.0, "b": 389.1, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 44, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 289.0, "r_y0": 389.1, "r_x1": 310.0, "r_y1": 389.1, "r_x2": 310.0, "r_y2": 381.0, "r_x3": 289.0, "r_y3": 381.0, "coord_origin": "TOPLEFT" }, "text": "0.969", "orig": "0.969", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 34, "label": "text", "bbox": { "l": 326.7, "t": 381.0, "r": 347.7, "b": 389.1, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 45, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 326.7, "r_y0": 389.1, "r_x1": 347.7, "r_y1": 389.1, "r_x2": 347.7, "r_y2": 381.0, "r_x3": 326.7, "r_y3": 381.0, "coord_origin": "TOPLEFT" }, "text": "0.927", "orig": "0.927", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 35, "label": "text", "bbox": { "l": 363.7, "t": 381.0, "r": 384.7, "b": 389.1, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 46, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 363.7, "r_y0": 389.1, "r_x1": 384.7, "r_y1": 389.1, "r_x2": 384.7, "r_y2": 381.0, "r_x3": 363.7, "r_y3": 381.0, "coord_origin": "TOPLEFT" }, "text": "0.955", "orig": "0.955", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 36, "label": "text", "bbox": { "l": 396.2, "t": 381.0, "r": 417.2, "b": 389.1, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 47, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 396.2, "r_y0": 389.1, "r_x1": 417.2, "r_y1": 389.1, "r_x2": 417.2, "r_y2": 381.0, "r_x3": 396.2, "r_y3": 381.0, "coord_origin": "TOPLEFT" }, "text": "0.857", "orig": "0.857", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 37, "label": "text", "bbox": { "l": 440.8, "t": 381.0, "r": 457.1, "b": 389.1, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 48, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 440.8, "r_y0": 389.1, "r_x1": 457.1, "r_y1": 389.1, "r_x2": 457.1, "r_y2": 381.0, "r_x3": 440.8, "r_y3": 381.0, "coord_origin": "TOPLEFT" }, "text": "5.39", "orig": "5.39", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 38, "label": "text", "bbox": { "l": 161.9, "t": 399.8, "r": 166.5, "b": 407.9, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 49, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 161.9, "r_y0": 407.9, "r_x1": 166.5, "r_y1": 407.9, "r_x2": 166.5, "r_y2": 399.8, "r_x3": 161.9, "r_y3": 399.8, "coord_origin": "TOPLEFT" }, "text": "4", "orig": "4", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 39, "label": "text", "bbox": { "l": 209.5, "t": 399.8, "r": 214.1, "b": 407.9, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 50, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 209.5, "r_y0": 407.9, "r_x1": 214.1, "r_y1": 407.9, "r_x2": 214.1, "r_y2": 399.8, "r_x3": 209.5, "r_y3": 399.8, "coord_origin": "TOPLEFT" }, "text": "4", "orig": "4", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 40, "label": "text", "bbox": { "l": 246.7, "t": 394.3, "r": 271.4, "b": 402.4, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 51, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 246.7, "r_y0": 402.4, "r_x1": 271.4, "r_y1": 402.4, "r_x2": 271.4, "r_y2": 394.3, "r_x3": 246.7, "r_y3": 394.3, "coord_origin": "TOPLEFT" }, "text": "OTSL", "orig": "OTSL", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 41, "label": "text", "bbox": { "l": 289.0, "t": 394.3, "r": 310.0, "b": 402.4, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 52, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 289.0, "r_y0": 402.4, "r_x1": 310.0, "r_y1": 402.4, "r_x2": 310.0, "r_y2": 394.3, "r_x3": 289.0, "r_y3": 394.3, "coord_origin": "TOPLEFT" }, "text": "0.938", "orig": "0.938", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 42, "label": "text", "bbox": { "l": 326.7, "t": 394.3, "r": 347.7, "b": 402.4, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 53, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 326.7, "r_y0": 402.4, "r_x1": 347.7, "r_y1": 402.4, "r_x2": 347.7, "r_y2": 394.3, "r_x3": 326.7, "r_y3": 394.3, "coord_origin": "TOPLEFT" }, "text": "0.904", "orig": "0.904", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 43, "label": "text", "bbox": { "l": 363.7, "t": 394.3, "r": 384.7, "b": 402.4, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 54, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 363.7, "r_y0": 402.4, "r_x1": 384.7, "r_y1": 402.4, "r_x2": 384.7, "r_y2": 394.3, "r_x3": 363.7, "r_y3": 394.3, "coord_origin": "TOPLEFT" }, "text": "0.927", "orig": "0.927", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 44, "label": "text", "bbox": { "l": 394.6, "t": 394.3, "r": 418.8, "b": 402.2, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 55, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 394.6, "r_y0": 402.2, "r_x1": 418.8, "r_y1": 402.2, "r_x2": 418.8, "r_y2": 394.3, "r_x3": 394.6, "r_y3": 394.3, "coord_origin": "TOPLEFT" }, "text": "0.853", "orig": "0.853", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 45, "label": "text", "bbox": { "l": 439.5, "t": 394.3, "r": 458.4, "b": 402.2, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 56, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 439.5, "r_y0": 402.2, "r_x1": 458.4, "r_y1": 402.2, "r_x2": 458.4, "r_y2": 394.3, "r_x3": 439.5, "r_y3": 394.3, "coord_origin": "TOPLEFT" }, "text": "1.97", "orig": "1.97", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 46, "label": "text", "bbox": { "l": 245.2, "t": 407.3, "r": 272.9, "b": 415.4, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 57, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 245.2, "r_y0": 415.4, "r_x1": 272.9, "r_y1": 415.4, "r_x2": 272.9, "r_y2": 407.3, "r_x3": 245.2, "r_y3": 407.3, "coord_origin": "TOPLEFT" }, "text": "HTML", "orig": "HTML", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 47, "label": "text", "bbox": { "l": 289.0, "t": 407.3, "r": 310.0, "b": 415.4, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 58, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 289.0, "r_y0": 415.4, "r_x1": 310.0, "r_y1": 415.4, "r_x2": 310.0, "r_y2": 407.3, "r_x3": 289.0, "r_y3": 407.3, "coord_origin": "TOPLEFT" }, "text": "0.952", "orig": "0.952", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 48, "label": "text", "bbox": { "l": 326.7, "t": 407.3, "r": 347.7, "b": 415.4, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 59, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 326.7, "r_y0": 415.4, "r_x1": 347.7, "r_y1": 415.4, "r_x2": 347.7, "r_y2": 407.3, "r_x3": 326.7, "r_y3": 407.3, "coord_origin": "TOPLEFT" }, "text": "0.909", "orig": "0.909", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 49, "label": "text", "bbox": { "l": 362.1, "t": 407.2, "r": 386.2, "b": 415.2, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 60, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 362.1, "r_y0": 415.2, "r_x1": 386.2, "r_y1": 415.2, "r_x2": 386.2, "r_y2": 407.2, "r_x3": 362.1, "r_y3": 407.2, "coord_origin": "TOPLEFT" }, "text": "0.938", "orig": "0.938", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 50, "label": "text", "bbox": { "l": 396.2, "t": 407.3, "r": 417.2, "b": 415.4, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 61, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 396.2, "r_y0": 415.4, "r_x1": 417.2, "r_y1": 415.4, "r_x2": 417.2, "r_y2": 407.3, "r_x3": 396.2, "r_y3": 407.3, "coord_origin": "TOPLEFT" }, "text": "0.843", "orig": "0.843", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 51, "label": "text", "bbox": { "l": 440.8, "t": 407.3, "r": 457.1, "b": 415.4, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 62, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 440.8, "r_y0": 415.4, "r_x1": 457.1, "r_y1": 415.4, "r_x2": 457.1, "r_y2": 407.3, "r_x3": 440.8, "r_y3": 407.3, "coord_origin": "TOPLEFT" }, "text": "3.77", "orig": "3.77", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 52, "label": "text", "bbox": { "l": 161.9, "t": 426.1, "r": 166.5, "b": 434.2, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 63, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 161.9, "r_y0": 434.2, "r_x1": 166.5, "r_y1": 434.2, "r_x2": 166.5, "r_y2": 426.1, "r_x3": 161.9, "r_y3": 426.1, "coord_origin": "TOPLEFT" }, "text": "2", "orig": "2", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 53, "label": "text", "bbox": { "l": 209.5, "t": 426.1, "r": 214.1, "b": 434.2, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 64, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 209.5, "r_y0": 434.2, "r_x1": 214.1, "r_y1": 434.2, "r_x2": 214.1, "r_y2": 426.1, "r_x3": 209.5, "r_y3": 426.1, "coord_origin": "TOPLEFT" }, "text": "4", "orig": "4", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 54, "label": "text", "bbox": { "l": 246.7, "t": 420.6, "r": 271.4, "b": 428.7, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 65, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 246.7, "r_y0": 428.7, "r_x1": 271.4, "r_y1": 428.7, "r_x2": 271.4, "r_y2": 420.6, "r_x3": 246.7, "r_y3": 420.6, "coord_origin": "TOPLEFT" }, "text": "OTSL", "orig": "OTSL", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 55, "label": "text", "bbox": { "l": 289.0, "t": 420.6, "r": 310.0, "b": 428.7, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 66, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 289.0, "r_y0": 428.7, "r_x1": 310.0, "r_y1": 428.7, "r_x2": 310.0, "r_y2": 420.6, "r_x3": 289.0, "r_y3": 420.6, "coord_origin": "TOPLEFT" }, "text": "0.923", "orig": "0.923", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 56, "label": "text", "bbox": { "l": 326.7, "t": 420.6, "r": 347.7, "b": 428.7, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 67, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 326.7, "r_y0": 428.7, "r_x1": 347.7, "r_y1": 428.7, "r_x2": 347.7, "r_y2": 420.6, "r_x3": 326.7, "r_y3": 420.6, "coord_origin": "TOPLEFT" }, "text": "0.897", "orig": "0.897", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 57, "label": "text", "bbox": { "l": 363.7, "t": 420.6, "r": 384.7, "b": 428.7, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 68, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 363.7, "r_y0": 428.7, "r_x1": 384.7, "r_y1": 428.7, "r_x2": 384.7, "r_y2": 420.6, "r_x3": 363.7, "r_y3": 420.6, "coord_origin": "TOPLEFT" }, "text": "0.915", "orig": "0.915", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 58, "label": "text", "bbox": { "l": 394.6, "t": 420.6, "r": 418.8, "b": 428.5, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 69, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 394.6, "r_y0": 428.5, "r_x1": 418.8, "r_y1": 428.5, "r_x2": 418.8, "r_y2": 420.6, "r_x3": 394.6, "r_y3": 420.6, "coord_origin": "TOPLEFT" }, "text": "0.859", "orig": "0.859", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 59, "label": "text", "bbox": { "l": 439.5, "t": 420.6, "r": 458.4, "b": 428.5, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 70, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 439.5, "r_y0": 428.5, "r_x1": 458.4, "r_y1": 428.5, "r_x2": 458.4, "r_y2": 420.6, "r_x3": 439.5, "r_y3": 420.6, "coord_origin": "TOPLEFT" }, "text": "1.91", "orig": "1.91", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 60, "label": "text", "bbox": { "l": 245.2, "t": 433.6, "r": 272.9, "b": 441.7, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 71, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 245.2, "r_y0": 441.7, "r_x1": 272.9, "r_y1": 441.7, "r_x2": 272.9, "r_y2": 433.6, "r_x3": 245.2, "r_y3": 433.6, "coord_origin": "TOPLEFT" }, "text": "HTML", "orig": "HTML", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 61, "label": "text", "bbox": { "l": 289.0, "t": 433.6, "r": 310.0, "b": 441.7, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 72, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 289.0, "r_y0": 441.7, "r_x1": 310.0, "r_y1": 441.7, "r_x2": 310.0, "r_y2": 433.6, "r_x3": 289.0, "r_y3": 433.6, "coord_origin": "TOPLEFT" }, "text": "0.945", "orig": "0.945", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 62, "label": "text", "bbox": { "l": 326.7, "t": 433.6, "r": 347.7, "b": 441.7, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 73, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 326.7, "r_y0": 441.7, "r_x1": 347.7, "r_y1": 441.7, "r_x2": 347.7, "r_y2": 433.6, "r_x3": 326.7, "r_y3": 433.6, "coord_origin": "TOPLEFT" }, "text": "0.901", "orig": "0.901", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 63, "label": "text", "bbox": { "l": 362.1, "t": 433.5, "r": 386.2, "b": 441.5, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 74, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 362.1, "r_y0": 441.5, "r_x1": 386.2, "r_y1": 441.5, "r_x2": 386.2, "r_y2": 433.5, "r_x3": 362.1, "r_y3": 433.5, "coord_origin": "TOPLEFT" }, "text": "0.931", "orig": "0.931", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 64, "label": "text", "bbox": { "l": 396.2, "t": 433.6, "r": 417.2, "b": 441.7, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 75, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 396.2, "r_y0": 441.7, "r_x1": 417.2, "r_y1": 441.7, "r_x2": 417.2, "r_y2": 433.6, "r_x3": 396.2, "r_y3": 433.6, "coord_origin": "TOPLEFT" }, "text": "0.834", "orig": "0.834", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 65, "label": "text", "bbox": { "l": 440.8, "t": 433.6, "r": 457.1, "b": 441.7, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 76, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 440.8, "r_y0": 441.7, "r_x1": 457.1, "r_y1": 441.7, "r_x2": 457.1, "r_y2": 433.6, "r_x3": 440.8, "r_y3": 433.6, "coord_origin": "TOPLEFT" }, "text": "3.81", "orig": "3.81", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 66, "label": "text", "bbox": { "l": 161.9, "t": 452.4, "r": 166.5, "b": 460.5, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 77, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 161.9, "r_y0": 460.5, "r_x1": 166.5, "r_y1": 460.5, "r_x2": 166.5, "r_y2": 452.4, "r_x3": 161.9, "r_y3": 452.4, "coord_origin": "TOPLEFT" }, "text": "4", "orig": "4", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 67, "label": "text", "bbox": { "l": 209.5, "t": 452.4, "r": 214.1, "b": 460.5, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 78, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 209.5, "r_y0": 460.5, "r_x1": 214.1, "r_y1": 460.5, "r_x2": 214.1, "r_y2": 452.4, "r_x3": 209.5, "r_y3": 452.4, "coord_origin": "TOPLEFT" }, "text": "2", "orig": "2", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 68, "label": "text", "bbox": { "l": 246.7, "t": 446.9, "r": 271.4, "b": 455.0, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 79, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 246.7, "r_y0": 455.0, "r_x1": 271.4, "r_y1": 455.0, "r_x2": 271.4, "r_y2": 446.9, "r_x3": 246.7, "r_y3": 446.9, "coord_origin": "TOPLEFT" }, "text": "OTSL", "orig": "OTSL", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 69, "label": "text", "bbox": { "l": 289.0, "t": 446.9, "r": 310.0, "b": 455.0, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 80, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 289.0, "r_y0": 455.0, "r_x1": 310.0, "r_y1": 455.0, "r_x2": 310.0, "r_y2": 446.9, "r_x3": 289.0, "r_y3": 446.9, "coord_origin": "TOPLEFT" }, "text": "0.952", "orig": "0.952", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 70, "label": "text", "bbox": { "l": 329.0, "t": 446.9, "r": 345.4, "b": 455.0, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 81, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 329.0, "r_y0": 455.0, "r_x1": 345.4, "r_y1": 455.0, "r_x2": 345.4, "r_y2": 446.9, "r_x3": 329.0, "r_y3": 446.9, "coord_origin": "TOPLEFT" }, "text": "0.92", "orig": "0.92", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 71, "label": "text", "bbox": { "l": 362.1, "t": 446.9, "r": 386.2, "b": 454.8, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 82, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 362.1, "r_y0": 454.8, "r_x1": 386.2, "r_y1": 454.8, "r_x2": 386.2, "r_y2": 446.9, "r_x3": 362.1, "r_y3": 446.9, "coord_origin": "TOPLEFT" }, "text": "0.942", "orig": "0.942", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 72, "label": "text", "bbox": { "l": 394.6, "t": 446.9, "r": 418.8, "b": 454.8, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 83, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 394.6, "r_y0": 454.8, "r_x1": 418.8, "r_y1": 454.8, "r_x2": 418.8, "r_y2": 446.9, "r_x3": 394.6, "r_y3": 446.9, "coord_origin": "TOPLEFT" }, "text": "0.857", "orig": "0.857", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 73, "label": "text", "bbox": { "l": 439.5, "t": 446.9, "r": 458.4, "b": 454.8, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 84, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 439.5, "r_y0": 454.8, "r_x1": 458.4, "r_y1": 454.8, "r_x2": 458.4, "r_y2": 446.9, "r_x3": 439.5, "r_y3": 446.9, "coord_origin": "TOPLEFT" }, "text": "1.22", "orig": "1.22", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 74, "label": "text", "bbox": { "l": 245.2, "t": 459.9, "r": 272.9, "b": 468.0, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 85, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 245.2, "r_y0": 468.0, "r_x1": 272.9, "r_y1": 468.0, "r_x2": 272.9, "r_y2": 459.9, "r_x3": 245.2, "r_y3": 459.9, "coord_origin": "TOPLEFT" }, "text": "HTML", "orig": "HTML", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 75, "label": "text", "bbox": { "l": 289.0, "t": 459.9, "r": 310.0, "b": 468.0, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 86, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 289.0, "r_y0": 468.0, "r_x1": 310.0, "r_y1": 468.0, "r_x2": 310.0, "r_y2": 459.9, "r_x3": 289.0, "r_y3": 459.9, "coord_origin": "TOPLEFT" }, "text": "0.944", "orig": "0.944", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 76, "label": "text", "bbox": { "l": 326.7, "t": 459.9, "r": 347.7, "b": 468.0, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 87, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 326.7, "r_y0": 468.0, "r_x1": 347.7, "r_y1": 468.0, "r_x2": 347.7, "r_y2": 459.9, "r_x3": 326.7, "r_y3": 459.9, "coord_origin": "TOPLEFT" }, "text": "0.903", "orig": "0.903", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 77, "label": "text", "bbox": { "l": 363.7, "t": 459.9, "r": 384.7, "b": 468.0, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 88, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 363.7, "r_y0": 468.0, "r_x1": 384.7, "r_y1": 468.0, "r_x2": 384.7, "r_y2": 459.9, "r_x3": 363.7, "r_y3": 459.9, "coord_origin": "TOPLEFT" }, "text": "0.931", "orig": "0.931", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 78, "label": "text", "bbox": { "l": 396.2, "t": 459.9, "r": 417.2, "b": 468.0, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 89, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 396.2, "r_y0": 468.0, "r_x1": 417.2, "r_y1": 468.0, "r_x2": 417.2, "r_y2": 459.9, "r_x3": 396.2, "r_y3": 459.9, "coord_origin": "TOPLEFT" }, "text": "0.824", "orig": "0.824", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 79, "label": "text", "bbox": { "l": 446.7, "t": 459.9, "r": 451.3, "b": 468.0, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 90, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 446.7, "r_y0": 468.0, "r_x1": 451.3, "r_y1": 468.0, "r_x2": 451.3, "r_y2": 459.9, "r_x3": 446.7, "r_y3": 459.9, "coord_origin": "TOPLEFT" }, "text": "2", "orig": "2", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] } ] }, "text": null, "otsl_seq": [ "ched", "ched", "ched", "ched", "lcel", "lcel", "ched", "ched", "nl", "ucel", "ucel", "ucel", "ched", "ched", "ched", "ched", "ched", "nl", "fcel", "fcel", "fcel", "fcel", "fcel", "fcel", "fcel", "fcel", "nl", "fcel", "fcel", "fcel", "fcel", "fcel", "fcel", "fcel", "fcel", "nl", "fcel", "fcel", "fcel", "fcel", "fcel", "fcel", "fcel", "fcel", "nl", "fcel", "fcel", "fcel", "fcel", "fcel", "fcel", "fcel", "fcel", "nl" ], "num_rows": 6, "num_cols": 8, "table_cells": [ { "bbox": { "l": 160.4, "t": 341.7, "r": 168.0, "b": 349.8, "coord_origin": "TOPLEFT" }, "row_span": 2, "col_span": 1, "start_row_offset_idx": 0, "end_row_offset_idx": 2, "start_col_offset_idx": 0, "end_col_offset_idx": 1, "text": "# enc-layers", "column_header": true, "row_header": false, "row_section": false }, { "bbox": { "l": 208.0, "t": 341.7, "r": 215.7, "b": 349.8, "coord_origin": "TOPLEFT" }, "row_span": 2, "col_span": 1, "start_row_offset_idx": 0, "end_row_offset_idx": 2, "start_col_offset_idx": 1, "end_col_offset_idx": 2, "text": "# dec-layers", "column_header": true, "row_header": false, "row_section": false }, { "bbox": { "l": 239.8, "t": 347.2, "r": 278.3, "b": 355.3, "coord_origin": "TOPLEFT" }, "row_span": 2, "col_span": 1, "start_row_offset_idx": 0, "end_row_offset_idx": 2, "start_col_offset_idx": 2, "end_col_offset_idx": 3, "text": "Language", "column_header": true, "row_header": false, "row_section": false }, { "bbox": { "l": 324.7, "t": 341.7, "r": 348.3, "b": 349.8, "coord_origin": "TOPLEFT" }, "row_span": 1, "col_span": 3, "start_row_offset_idx": 0, "end_row_offset_idx": 1, "start_col_offset_idx": 3, "end_col_offset_idx": 6, "text": "TEDs", "column_header": true, "row_header": false, "row_section": false }, { "bbox": { "l": 396.3, "t": 341.7, "r": 417.1, "b": 349.8, "coord_origin": "TOPLEFT" }, "row_span": 1, "col_span": 1, "start_row_offset_idx": 0, "end_row_offset_idx": 1, "start_col_offset_idx": 6, "end_col_offset_idx": 7, "text": "mAP", "column_header": true, "row_header": false, "row_section": false }, { "bbox": { "l": 394.9, "t": 352.7, "r": 418.5, "b": 360.8, "coord_origin": "TOPLEFT" }, "row_span": 1, "col_span": 1, "start_row_offset_idx": 1, "end_row_offset_idx": 2, "start_col_offset_idx": 6, "end_col_offset_idx": 7, "text": "(0.75)", "column_header": true, "row_header": false, "row_section": false }, { "bbox": { "l": 430.8, "t": 341.7, "r": 467.1, "b": 349.8, "coord_origin": "TOPLEFT" }, "row_span": 1, "col_span": 1, "start_row_offset_idx": 0, "end_row_offset_idx": 1, "start_col_offset_idx": 7, "end_col_offset_idx": 8, "text": "Inference", "column_header": true, "row_header": false, "row_section": false }, { "bbox": { "l": 427.1, "t": 352.7, "r": 470.8, "b": 360.8, "coord_origin": "TOPLEFT" }, "row_span": 1, "col_span": 1, "start_row_offset_idx": 1, "end_row_offset_idx": 2, "start_col_offset_idx": 7, "end_col_offset_idx": 8, "text": "time (secs)", "column_header": true, "row_header": false, "row_section": false }, { "bbox": { "l": 286.7, "t": 354.7, "r": 312.3, "b": 362.8, "coord_origin": "TOPLEFT" }, "row_span": 1, "col_span": 1, "start_row_offset_idx": 1, "end_row_offset_idx": 2, "start_col_offset_idx": 3, "end_col_offset_idx": 4, "text": "simple", "column_header": true, "row_header": false, "row_section": false }, { "bbox": { "l": 320.7, "t": 354.7, "r": 353.7, "b": 362.8, "coord_origin": "TOPLEFT" }, "row_span": 1, "col_span": 1, "start_row_offset_idx": 1, "end_row_offset_idx": 2, "start_col_offset_idx": 4, "end_col_offset_idx": 5, "text": "complex", "column_header": true, "row_header": false, "row_section": false }, { "bbox": { "l": 369.3, "t": 354.7, "r": 379.0, "b": 362.8, "coord_origin": "TOPLEFT" }, "row_span": 1, "col_span": 1, "start_row_offset_idx": 1, "end_row_offset_idx": 2, "start_col_offset_idx": 5, "end_col_offset_idx": 6, "text": "all", "column_header": true, "row_header": false, "row_section": false }, { "bbox": { "l": 161.9, "t": 373.5, "r": 166.5, "b": 381.6, "coord_origin": "TOPLEFT" }, "row_span": 1, "col_span": 1, "start_row_offset_idx": 2, "end_row_offset_idx": 3, "start_col_offset_idx": 0, "end_col_offset_idx": 1, "text": "6", "column_header": false, "row_header": false, "row_section": false }, { "bbox": { "l": 209.5, "t": 373.5, "r": 214.1, "b": 381.6, "coord_origin": "TOPLEFT" }, "row_span": 1, "col_span": 1, "start_row_offset_idx": 2, "end_row_offset_idx": 3, "start_col_offset_idx": 1, "end_col_offset_idx": 2, "text": "6", "column_header": false, "row_header": false, "row_section": false }, { "bbox": { "l": 246.7, "t": 368.0, "r": 271.4, "b": 376.1, "coord_origin": "TOPLEFT" }, "row_span": 1, "col_span": 1, "start_row_offset_idx": 2, "end_row_offset_idx": 3, "start_col_offset_idx": 2, "end_col_offset_idx": 3, "text": "OTSL HTML", "column_header": false, "row_header": false, "row_section": false }, { "bbox": { "l": 289.0, "t": 368.0, "r": 310.0, "b": 376.1, "coord_origin": "TOPLEFT" }, "row_span": 1, "col_span": 1, "start_row_offset_idx": 2, "end_row_offset_idx": 3, "start_col_offset_idx": 3, "end_col_offset_idx": 4, "text": "0.965 0.969", "column_header": false, "row_header": false, "row_section": false }, { "bbox": { "l": 326.7, "t": 368.0, "r": 347.7, "b": 376.1, "coord_origin": "TOPLEFT" }, "row_span": 1, "col_span": 1, "start_row_offset_idx": 2, "end_row_offset_idx": 3, "start_col_offset_idx": 4, "end_col_offset_idx": 5, "text": "0.934 0.927", "column_header": false, "row_header": false, "row_section": false }, { "bbox": { "l": 363.7, "t": 368.0, "r": 384.7, "b": 376.1, "coord_origin": "TOPLEFT" }, "row_span": 1, "col_span": 1, "start_row_offset_idx": 2, "end_row_offset_idx": 3, "start_col_offset_idx": 5, "end_col_offset_idx": 6, "text": "0.955 0.955", "column_header": false, "row_header": false, "row_section": false }, { "bbox": { "l": 397.3, "t": 368.0, "r": 416.1, "b": 375.9, "coord_origin": "TOPLEFT" }, "row_span": 1, "col_span": 1, "start_row_offset_idx": 2, "end_row_offset_idx": 3, "start_col_offset_idx": 6, "end_col_offset_idx": 7, "text": "0.88 0.857", "column_header": false, "row_header": false, "row_section": false }, { "bbox": { "l": 439.5, "t": 368.0, "r": 458.4, "b": 375.9, "coord_origin": "TOPLEFT" }, "row_span": 1, "col_span": 1, "start_row_offset_idx": 2, "end_row_offset_idx": 3, "start_col_offset_idx": 7, "end_col_offset_idx": 8, "text": "2.73 5.39", "column_header": false, "row_header": false, "row_section": false }, { "bbox": { "l": 161.9, "t": 399.8, "r": 166.5, "b": 407.9, "coord_origin": "TOPLEFT" }, "row_span": 1, "col_span": 1, "start_row_offset_idx": 3, "end_row_offset_idx": 4, "start_col_offset_idx": 0, "end_col_offset_idx": 1, "text": "4", "column_header": false, "row_header": false, "row_section": false }, { "bbox": { "l": 209.5, "t": 399.8, "r": 214.1, "b": 407.9, "coord_origin": "TOPLEFT" }, "row_span": 1, "col_span": 1, "start_row_offset_idx": 3, "end_row_offset_idx": 4, "start_col_offset_idx": 1, "end_col_offset_idx": 2, "text": "4", "column_header": false, "row_header": false, "row_section": false }, { "bbox": { "l": 246.7, "t": 394.3, "r": 271.4, "b": 402.4, "coord_origin": "TOPLEFT" }, "row_span": 1, "col_span": 1, "start_row_offset_idx": 3, "end_row_offset_idx": 4, "start_col_offset_idx": 2, "end_col_offset_idx": 3, "text": "OTSL HTML", "column_header": false, "row_header": false, "row_section": false }, { "bbox": { "l": 289.0, "t": 394.3, "r": 310.0, "b": 402.4, "coord_origin": "TOPLEFT" }, "row_span": 1, "col_span": 1, "start_row_offset_idx": 3, "end_row_offset_idx": 4, "start_col_offset_idx": 3, "end_col_offset_idx": 4, "text": "0.938 0.952", "column_header": false, "row_header": false, "row_section": false }, { "bbox": { "l": 326.7, "t": 394.3, "r": 347.7, "b": 402.4, "coord_origin": "TOPLEFT" }, "row_span": 1, "col_span": 1, "start_row_offset_idx": 3, "end_row_offset_idx": 4, "start_col_offset_idx": 4, "end_col_offset_idx": 5, "text": "0.904 0.909", "column_header": false, "row_header": false, "row_section": false }, { "bbox": { "l": 363.7, "t": 394.3, "r": 384.7, "b": 402.4, "coord_origin": "TOPLEFT" }, "row_span": 1, "col_span": 1, "start_row_offset_idx": 3, "end_row_offset_idx": 4, "start_col_offset_idx": 5, "end_col_offset_idx": 6, "text": "0.927 0.938", "column_header": false, "row_header": false, "row_section": false }, { "bbox": { "l": 394.6, "t": 394.3, "r": 418.8, "b": 402.2, "coord_origin": "TOPLEFT" }, "row_span": 1, "col_span": 1, "start_row_offset_idx": 3, "end_row_offset_idx": 4, "start_col_offset_idx": 6, "end_col_offset_idx": 7, "text": "0.853 0.843", "column_header": false, "row_header": false, "row_section": false }, { "bbox": { "l": 439.5, "t": 394.3, "r": 458.4, "b": 402.2, "coord_origin": "TOPLEFT" }, "row_span": 1, "col_span": 1, "start_row_offset_idx": 3, "end_row_offset_idx": 4, "start_col_offset_idx": 7, "end_col_offset_idx": 8, "text": "1.97 3.77", "column_header": false, "row_header": false, "row_section": false }, { "bbox": { "l": 161.9, "t": 426.1, "r": 166.5, "b": 434.2, "coord_origin": "TOPLEFT" }, "row_span": 1, "col_span": 1, "start_row_offset_idx": 4, "end_row_offset_idx": 5, "start_col_offset_idx": 0, "end_col_offset_idx": 1, "text": "2", "column_header": false, "row_header": false, "row_section": false }, { "bbox": { "l": 209.5, "t": 426.1, "r": 214.1, "b": 434.2, "coord_origin": "TOPLEFT" }, "row_span": 1, "col_span": 1, "start_row_offset_idx": 4, "end_row_offset_idx": 5, "start_col_offset_idx": 1, "end_col_offset_idx": 2, "text": "4", "column_header": false, "row_header": false, "row_section": false }, { "bbox": { "l": 246.7, "t": 420.6, "r": 271.4, "b": 428.7, "coord_origin": "TOPLEFT" }, "row_span": 1, "col_span": 1, "start_row_offset_idx": 4, "end_row_offset_idx": 5, "start_col_offset_idx": 2, "end_col_offset_idx": 3, "text": "OTSL HTML", "column_header": false, "row_header": false, "row_section": false }, { "bbox": { "l": 289.0, "t": 420.6, "r": 310.0, "b": 428.7, "coord_origin": "TOPLEFT" }, "row_span": 1, "col_span": 1, "start_row_offset_idx": 4, "end_row_offset_idx": 5, "start_col_offset_idx": 3, "end_col_offset_idx": 4, "text": "0.923 0.945", "column_header": false, "row_header": false, "row_section": false }, { "bbox": { "l": 326.7, "t": 420.6, "r": 347.7, "b": 428.7, "coord_origin": "TOPLEFT" }, "row_span": 1, "col_span": 1, "start_row_offset_idx": 4, "end_row_offset_idx": 5, "start_col_offset_idx": 4, "end_col_offset_idx": 5, "text": "0.897 0.901", "column_header": false, "row_header": false, "row_section": false }, { "bbox": { "l": 363.7, "t": 420.6, "r": 384.7, "b": 428.7, "coord_origin": "TOPLEFT" }, "row_span": 1, "col_span": 1, "start_row_offset_idx": 4, "end_row_offset_idx": 5, "start_col_offset_idx": 5, "end_col_offset_idx": 6, "text": "0.915 0.931", "column_header": false, "row_header": false, "row_section": false }, { "bbox": { "l": 394.6, "t": 420.6, "r": 418.8, "b": 428.5, "coord_origin": "TOPLEFT" }, "row_span": 1, "col_span": 1, "start_row_offset_idx": 4, "end_row_offset_idx": 5, "start_col_offset_idx": 6, "end_col_offset_idx": 7, "text": "0.859 0.834", "column_header": false, "row_header": false, "row_section": false }, { "bbox": { "l": 439.5, "t": 420.6, "r": 458.4, "b": 428.5, "coord_origin": "TOPLEFT" }, "row_span": 1, "col_span": 1, "start_row_offset_idx": 4, "end_row_offset_idx": 5, "start_col_offset_idx": 7, "end_col_offset_idx": 8, "text": "1.91 3.81", "column_header": false, "row_header": false, "row_section": false }, { "bbox": { "l": 161.9, "t": 452.4, "r": 166.5, "b": 460.5, "coord_origin": "TOPLEFT" }, "row_span": 1, "col_span": 1, "start_row_offset_idx": 5, "end_row_offset_idx": 6, "start_col_offset_idx": 0, "end_col_offset_idx": 1, "text": "4", "column_header": false, "row_header": false, "row_section": false }, { "bbox": { "l": 209.5, "t": 452.4, "r": 214.1, "b": 460.5, "coord_origin": "TOPLEFT" }, "row_span": 1, "col_span": 1, "start_row_offset_idx": 5, "end_row_offset_idx": 6, "start_col_offset_idx": 1, "end_col_offset_idx": 2, "text": "2", "column_header": false, "row_header": false, "row_section": false }, { "bbox": { "l": 246.7, "t": 446.9, "r": 271.4, "b": 455.0, "coord_origin": "TOPLEFT" }, "row_span": 1, "col_span": 1, "start_row_offset_idx": 5, "end_row_offset_idx": 6, "start_col_offset_idx": 2, "end_col_offset_idx": 3, "text": "OTSL HTML", "column_header": false, "row_header": false, "row_section": false }, { "bbox": { "l": 289.0, "t": 446.9, "r": 310.0, "b": 455.0, "coord_origin": "TOPLEFT" }, "row_span": 1, "col_span": 1, "start_row_offset_idx": 5, "end_row_offset_idx": 6, "start_col_offset_idx": 3, "end_col_offset_idx": 4, "text": "0.952 0.944", "column_header": false, "row_header": false, "row_section": false }, { "bbox": { "l": 329.0, "t": 446.9, "r": 345.4, "b": 455.0, "coord_origin": "TOPLEFT" }, "row_span": 1, "col_span": 1, "start_row_offset_idx": 5, "end_row_offset_idx": 6, "start_col_offset_idx": 4, "end_col_offset_idx": 5, "text": "0.92 0.903", "column_header": false, "row_header": false, "row_section": false }, { "bbox": { "l": 362.1, "t": 446.9, "r": 386.2, "b": 454.8, "coord_origin": "TOPLEFT" }, "row_span": 1, "col_span": 1, "start_row_offset_idx": 5, "end_row_offset_idx": 6, "start_col_offset_idx": 5, "end_col_offset_idx": 6, "text": "0.942 0.931", "column_header": false, "row_header": false, "row_section": false }, { "bbox": { "l": 394.6, "t": 446.9, "r": 418.8, "b": 454.8, "coord_origin": "TOPLEFT" }, "row_span": 1, "col_span": 1, "start_row_offset_idx": 5, "end_row_offset_idx": 6, "start_col_offset_idx": 6, "end_col_offset_idx": 7, "text": "0.857 0.824", "column_header": false, "row_header": false, "row_section": false }, { "bbox": { "l": 439.5, "t": 446.9, "r": 458.4, "b": 454.8, "coord_origin": "TOPLEFT" }, "row_span": 1, "col_span": 1, "start_row_offset_idx": 5, "end_row_offset_idx": 6, "start_col_offset_idx": 7, "end_col_offset_idx": 8, "text": "1.22 2", "column_header": false, "row_header": false, "row_section": false } ] }, { "label": "section_header", "id": 5, "page_no": 8, "cluster": { "id": 5, "label": "section_header", "bbox": { "l": 134.8, "t": 508.2, "r": 264.4, "b": 517.0, "coord_origin": "TOPLEFT" }, "confidence": 0.96, "cells": [ { "index": 91, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 134.8, "r_y0": 517.0, "r_x1": 149.4, "r_y1": 517.0, "r_x2": 149.4, "r_y2": 508.2, "r_x3": 134.8, "r_y3": 508.2, "coord_origin": "TOPLEFT" }, "text": "5.2", "orig": "5.2", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 92, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 160.9, "r_y0": 517.0, "r_x1": 264.4, "r_y1": 517.0, "r_x2": 264.4, "r_y2": 508.2, "r_x3": 160.9, "r_y3": 508.2, "coord_origin": "TOPLEFT" }, "text": "Quantitative Results", "orig": "Quantitative Results", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, "text": "5.2 Quantitative Results" }, { "label": "text", "id": 1, "page_no": 8, "cluster": { "id": 1, "label": "text", "bbox": { "l": 134.8, "t": 524.6, "r": 480.6, "b": 617.0, "coord_origin": "TOPLEFT" }, "confidence": 0.99, "cells": [ { "index": 93, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 134.8, "r_y0": 533.3, "r_x1": 480.6, "r_y1": 533.3, "r_x2": 480.6, "r_y2": 524.6, "r_x3": 134.8, "r_y3": 524.6, "coord_origin": "TOPLEFT" }, "text": "We picked the model parameter configuration that produced the best prediction", "orig": "We picked the model parameter configuration that produced the best prediction", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 94, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 134.8, "r_y0": 545.3, "r_x1": 480.6, "r_y1": 545.3, "r_x2": 480.6, "r_y2": 536.5, "r_x3": 134.8, "r_y3": 536.5, "coord_origin": "TOPLEFT" }, "text": "quality (enc=6, dec=6, heads=8) with PubTabNet alone, then independently", "orig": "quality (enc=6, dec=6, heads=8) with PubTabNet alone, then independently", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 95, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 134.8, "r_y0": 557.3, "r_x1": 480.6, "r_y1": 557.3, "r_x2": 480.6, "r_y2": 548.5, "r_x3": 134.8, "r_y3": 548.5, "coord_origin": "TOPLEFT" }, "text": "trained and evaluated it on three publicly available data sets: PubTabNet (395k", "orig": "trained and evaluated it on three publicly available data sets: PubTabNet (395k", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 96, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 134.8, "r_y0": 569.2, "r_x1": 480.6, "r_y1": 569.2, "r_x2": 480.6, "r_y2": 560.4, "r_x3": 134.8, "r_y3": 560.4, "coord_origin": "TOPLEFT" }, "text": "samples), FinTabNet (113k samples) and PubTables-1M (about 1M samples).", "orig": "samples), FinTabNet (113k samples) and PubTables-1M (about 1M samples).", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 97, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 134.8, "r_y0": 581.2, "r_x1": 480.6, "r_y1": 581.2, "r_x2": 480.6, "r_y2": 572.4, "r_x3": 134.8, "r_y3": 572.4, "coord_origin": "TOPLEFT" }, "text": "Performance results are presented in Table. 2. It is clearly evident that the model", "orig": "Performance results are presented in Table. 2. It is clearly evident that the model", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 98, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 134.8, "r_y0": 593.1, "r_x1": 480.6, "r_y1": 593.1, "r_x2": 480.6, "r_y2": 584.3, "r_x3": 134.8, "r_y3": 584.3, "coord_origin": "TOPLEFT" }, "text": "trained on OTSL outperforms HTML across the board, keeping high TEDs and", "orig": "trained on OTSL outperforms HTML across the board, keeping high TEDs and", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 99, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 134.8, "r_y0": 605.1, "r_x1": 480.6, "r_y1": 605.1, "r_x2": 480.6, "r_y2": 596.3, "r_x3": 134.8, "r_y3": 596.3, "coord_origin": "TOPLEFT" }, "text": "mAP scores even on difficult financial tables (FinTabNet) that contain sparse", "orig": "mAP scores even on difficult financial tables (FinTabNet) that contain sparse", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 100, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 134.8, "r_y0": 617.0, "r_x1": 206.8, "r_y1": 617.0, "r_x2": 206.8, "r_y2": 608.2, "r_x3": 134.8, "r_y3": 608.2, "coord_origin": "TOPLEFT" }, "text": "and large tables.", "orig": "and large tables.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, "text": "We picked the model parameter configuration that produced the best prediction quality (enc=6, dec=6, heads=8) with PubTabNet alone, then independently trained and evaluated it on three publicly available data sets: PubTabNet (395k samples), FinTabNet (113k samples) and PubTables-1M (about 1M samples). Performance results are presented in Table. 2. It is clearly evident that the model trained on OTSL outperforms HTML across the board, keeping high TEDs and mAP scores even on difficult financial tables (FinTabNet) that contain sparse and large tables." }, { "label": "text", "id": 2, "page_no": 8, "cluster": { "id": 2, "label": "text", "bbox": { "l": 134.8, "t": 620.2, "r": 480.6, "b": 664.9, "coord_origin": "TOPLEFT" }, "confidence": 0.99, "cells": [ { "index": 101, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 149.7, "r_y0": 629.0, "r_x1": 480.6, "r_y1": 629.0, "r_x2": 480.6, "r_y2": 620.2, "r_x3": 149.7, "r_y3": 620.2, "coord_origin": "TOPLEFT" }, "text": "Additionally, the results show that OTSL has an advantage over HTML", "orig": "Additionally, the results show that OTSL has an advantage over HTML", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 102, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 134.8, "r_y0": 640.9, "r_x1": 480.6, "r_y1": 640.9, "r_x2": 480.6, "r_y2": 632.1, "r_x3": 134.8, "r_y3": 632.1, "coord_origin": "TOPLEFT" }, "text": "when applied on a bigger data set like PubTables-1M and achieves significantly", "orig": "when applied on a bigger data set like PubTables-1M and achieves significantly", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 103, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 134.8, "r_y0": 652.9, "r_x1": 480.6, "r_y1": 652.9, "r_x2": 480.6, "r_y2": 644.1, "r_x3": 134.8, "r_y3": 644.1, "coord_origin": "TOPLEFT" }, "text": "improved scores. Finally, OTSL achieves faster inference due to fewer decoding", "orig": "improved scores. Finally, OTSL achieves faster inference due to fewer decoding", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 104, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 134.8, "r_y0": 664.9, "r_x1": 405.8, "r_y1": 664.9, "r_x2": 405.8, "r_y2": 656.1, "r_x3": 134.8, "r_y3": 656.1, "coord_origin": "TOPLEFT" }, "text": "steps which is a result of the reduced sequence representation.", "orig": "steps which is a result of the reduced sequence representation.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, "text": "Additionally, the results show that OTSL has an advantage over HTML when applied on a bigger data set like PubTables-1M and achieves significantly improved scores. Finally, OTSL achieves faster inference due to fewer decoding steps which is a result of the reduced sequence representation." } ], "headers": [ { "label": "page_header", "id": 8, "page_no": 8, "cluster": { "id": 8, "label": "page_header", "bbox": { "l": 194.5, "t": 93.8, "r": 447.5, "b": 101.8, "coord_origin": "TOPLEFT" }, "confidence": 0.94, "cells": [ { "index": 0, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 194.5, "r_y0": 101.8, "r_x1": 447.5, "r_y1": 101.8, "r_x2": 447.5, "r_y2": 93.8, "r_x3": 194.5, "r_y3": 93.8, "coord_origin": "TOPLEFT" }, "text": "Optimized Table Tokenization for Table Structure Recognition", "orig": "Optimized Table Tokenization for Table Structure Recognition", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, "text": "Optimized Table Tokenization for Table Structure Recognition" }, { "label": "page_header", "id": 9, "page_no": 8, "cluster": { "id": 9, "label": "page_header", "bbox": { "l": 476.0, "t": 93.8, "r": 480.6, "b": 101.8, "coord_origin": "TOPLEFT" }, "confidence": 0.89, "cells": [ { "index": 1, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 476.0, "r_y0": 101.8, "r_x1": 480.6, "r_y1": 101.8, "r_x2": 480.6, "r_y2": 93.8, "r_x3": 476.0, "r_y3": 93.8, "coord_origin": "TOPLEFT" }, "text": "9", "orig": "9", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, "text": "9" } ] } }, { "page_no": 9, "size": { "width": 612.0, "height": 792.0 }, "parsed_page": { "dimension": { "angle": 0.0, "rect": { "r_x0": 0.0, "r_y0": 0.0, "r_x1": 612.0, "r_y1": 0.0, "r_x2": 612.0, "r_y2": 792.0, "r_x3": 0.0, "r_y3": 792.0, "coord_origin": "BOTTOMLEFT" }, "boundary_type": "crop_box", "art_bbox": { "l": 0.0, "t": 792.0, "r": 612.0, "b": 0.0, "coord_origin": "BOTTOMLEFT" }, "bleed_bbox": { "l": 0.0, "t": 792.0, "r": 612.0, "b": 0.0, "coord_origin": "BOTTOMLEFT" }, "crop_bbox": { "l": 0.0, "t": 792.0, "r": 612.0, "b": 0.0, "coord_origin": "BOTTOMLEFT" }, "media_bbox": { "l": 0.0, "t": 792.0, "r": 612.0, "b": 0.0, "coord_origin": "BOTTOMLEFT" }, "trim_bbox": { "l": 0.0, "t": 792.0, "r": 612.0, "b": 0.0, "coord_origin": "BOTTOMLEFT" } }, "bitmap_resources": [], "char_cells": [], "word_cells": [], "textline_cells": [ { "index": 0, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 134.8, "r_y0": 101.8, "r_x1": 144.0, "r_y1": 101.8, "r_x2": 144.0, "r_y2": 93.8, "r_x3": 134.8, "r_y3": 93.8, "coord_origin": "TOPLEFT" }, "text": "10", "orig": "10", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 1, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 167.8, "r_y0": 101.8, "r_x1": 178.1, "r_y1": 101.8, "r_x2": 178.1, "r_y2": 93.8, "r_x3": 167.8, "r_y3": 93.8, "coord_origin": "TOPLEFT" }, "text": "M.", "orig": "M.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 2, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 182.4, "r_y0": 101.8, "r_x1": 231.7, "r_y1": 101.8, "r_x2": 231.7, "r_y2": 93.8, "r_x3": 182.4, "r_y3": 93.8, "coord_origin": "TOPLEFT" }, "text": "Lysak, et al.", "orig": "Lysak, et al.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 3, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 134.8, "r_y0": 123.8, "r_x1": 173.1, "r_y1": 123.8, "r_x2": 173.1, "r_y2": 115.8, "r_x3": 134.8, "r_y3": 115.8, "coord_origin": "TOPLEFT" }, "text": "Table 2.", "orig": "Table 2.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 4, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 181.3, "r_y0": 124.0, "r_x1": 480.6, "r_y1": 124.0, "r_x2": 480.6, "r_y2": 115.9, "r_x3": 181.3, "r_y3": 115.9, "coord_origin": "TOPLEFT" }, "text": "TSR and cell detection results compared between OTSL and HTML on", "orig": "TSR and cell detection results compared between OTSL and HTML on", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 5, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 134.8, "r_y0": 134.9, "r_x1": 480.6, "r_y1": 134.9, "r_x2": 480.6, "r_y2": 126.9, "r_x3": 134.8, "r_y3": 126.9, "coord_origin": "TOPLEFT" }, "text": "the PubTabNet [22], FinTabNet [21] and PubTables-1M [14] data sets using Table-", "orig": "the PubTabNet [22], FinTabNet [21] and PubTables-1M [14] data sets using Table-", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 6, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 134.8, "r_y0": 145.9, "r_x1": 306.0, "r_y1": 145.9, "r_x2": 306.0, "r_y2": 137.8, "r_x3": 134.8, "r_y3": 137.8, "coord_origin": "TOPLEFT" }, "text": "Former [9] (with enc=6, dec=6, heads=8).", "orig": "Former [9] (with enc=6, dec=6, heads=8).", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 7, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 160.8, "r_y0": 174.6, "r_x1": 195.0, "r_y1": 174.6, "r_x2": 195.0, "r_y2": 166.6, "r_x3": 160.8, "r_y3": 166.6, "coord_origin": "TOPLEFT" }, "text": "Data set", "orig": "Data set", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 8, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 215.5, "r_y0": 174.6, "r_x1": 254.0, "r_y1": 174.6, "r_x2": 254.0, "r_y2": 166.5, "r_x3": 215.5, "r_y3": 166.5, "coord_origin": "TOPLEFT" }, "text": "Language", "orig": "Language", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 9, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 300.4, "r_y0": 169.1, "r_x1": 324.0, "r_y1": 169.1, "r_x2": 324.0, "r_y2": 161.1, "r_x3": 300.4, "r_y3": 161.1, "coord_origin": "TOPLEFT" }, "text": "TEDs", "orig": "TEDs", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 10, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 370.3, "r_y0": 174.6, "r_x1": 414.7, "r_y1": 174.6, "r_x2": 414.7, "r_y2": 166.6, "r_x3": 370.3, "r_y3": 166.6, "coord_origin": "TOPLEFT" }, "text": "mAP(0.75)", "orig": "mAP(0.75)", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 11, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 426.7, "r_y0": 169.1, "r_x1": 463.1, "r_y1": 169.1, "r_x2": 463.1, "r_y2": 161.1, "r_x3": 426.7, "r_y3": 161.1, "coord_origin": "TOPLEFT" }, "text": "Inference", "orig": "Inference", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 12, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 423.1, "r_y0": 180.1, "r_x1": 466.7, "r_y1": 180.1, "r_x2": 466.7, "r_y2": 172.0, "r_x3": 423.1, "r_y3": 172.0, "coord_origin": "TOPLEFT" }, "text": "time (secs)", "orig": "time (secs)", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 13, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 262.4, "r_y0": 182.1, "r_x1": 288.1, "r_y1": 182.1, "r_x2": 288.1, "r_y2": 174.0, "r_x3": 262.4, "r_y3": 174.0, "coord_origin": "TOPLEFT" }, "text": "simple", "orig": "simple", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 14, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 296.4, "r_y0": 182.1, "r_x1": 329.4, "r_y1": 182.1, "r_x2": 329.4, "r_y2": 174.0, "r_x3": 296.4, "r_y3": 174.0, "coord_origin": "TOPLEFT" }, "text": "complex", "orig": "complex", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 15, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 345.0, "r_y0": 182.1, "r_x1": 354.8, "r_y1": 182.1, "r_x2": 354.8, "r_y2": 174.0, "r_x3": 345.0, "r_y3": 174.0, "coord_origin": "TOPLEFT" }, "text": "all", "orig": "all", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 16, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 154.5, "r_y0": 200.9, "r_x1": 201.2, "r_y1": 200.9, "r_x2": 201.2, "r_y2": 192.9, "r_x3": 154.5, "r_y3": 192.9, "coord_origin": "TOPLEFT" }, "text": "PubTabNet", "orig": "PubTabNet", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 17, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 222.4, "r_y0": 195.5, "r_x1": 247.1, "r_y1": 195.5, "r_x2": 247.1, "r_y2": 187.4, "r_x3": 222.4, "r_y3": 187.4, "coord_origin": "TOPLEFT" }, "text": "OTSL", "orig": "OTSL", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 18, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 264.7, "r_y0": 195.5, "r_x1": 285.7, "r_y1": 195.5, "r_x2": 285.7, "r_y2": 187.4, "r_x3": 264.7, "r_y3": 187.4, "coord_origin": "TOPLEFT" }, "text": "0.965", "orig": "0.965", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 19, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 302.4, "r_y0": 195.5, "r_x1": 323.4, "r_y1": 195.5, "r_x2": 323.4, "r_y2": 187.4, "r_x3": 302.4, "r_y3": 187.4, "coord_origin": "TOPLEFT" }, "text": "0.934", "orig": "0.934", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 20, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 339.4, "r_y0": 195.5, "r_x1": 360.4, "r_y1": 195.5, "r_x2": 360.4, "r_y2": 187.4, "r_x3": 339.4, "r_y3": 187.4, "coord_origin": "TOPLEFT" }, "text": "0.955", "orig": "0.955", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 21, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 383.1, "r_y0": 195.2, "r_x1": 402.0, "r_y1": 195.2, "r_x2": 402.0, "r_y2": 187.3, "r_x3": 383.1, "r_y3": 187.3, "coord_origin": "TOPLEFT" }, "text": "0.88", "orig": "0.88", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 22, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 435.5, "r_y0": 195.2, "r_x1": 454.4, "r_y1": 195.2, "r_x2": 454.4, "r_y2": 187.3, "r_x3": 435.5, "r_y3": 187.3, "coord_origin": "TOPLEFT" }, "text": "2.73", "orig": "2.73", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 23, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 220.9, "r_y0": 208.4, "r_x1": 248.7, "r_y1": 208.4, "r_x2": 248.7, "r_y2": 200.3, "r_x3": 220.9, "r_y3": 200.3, "coord_origin": "TOPLEFT" }, "text": "HTML", "orig": "HTML", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 24, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 264.7, "r_y0": 208.4, "r_x1": 285.7, "r_y1": 208.4, "r_x2": 285.7, "r_y2": 200.3, "r_x3": 264.7, "r_y3": 200.3, "coord_origin": "TOPLEFT" }, "text": "0.969", "orig": "0.969", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 25, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 302.4, "r_y0": 208.4, "r_x1": 323.4, "r_y1": 208.4, "r_x2": 323.4, "r_y2": 200.3, "r_x3": 302.4, "r_y3": 200.3, "coord_origin": "TOPLEFT" }, "text": "0.927", "orig": "0.927", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 26, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 339.4, "r_y0": 208.4, "r_x1": 360.4, "r_y1": 208.4, "r_x2": 360.4, "r_y2": 200.3, "r_x3": 339.4, "r_y3": 200.3, "coord_origin": "TOPLEFT" }, "text": "0.955", "orig": "0.955", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 27, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 382.1, "r_y0": 208.4, "r_x1": 403.0, "r_y1": 208.4, "r_x2": 403.0, "r_y2": 200.3, "r_x3": 382.1, "r_y3": 200.3, "coord_origin": "TOPLEFT" }, "text": "0.857", "orig": "0.857", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 28, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 436.7, "r_y0": 208.4, "r_x1": 453.1, "r_y1": 208.4, "r_x2": 453.1, "r_y2": 200.3, "r_x3": 436.7, "r_y3": 200.3, "coord_origin": "TOPLEFT" }, "text": "5.39", "orig": "5.39", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 29, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 155.9, "r_y0": 227.2, "r_x1": 199.8, "r_y1": 227.2, "r_x2": 199.8, "r_y2": 219.2, "r_x3": 155.9, "r_y3": 219.2, "coord_origin": "TOPLEFT" }, "text": "FinTabNet", "orig": "FinTabNet", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 30, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 222.4, "r_y0": 221.8, "r_x1": 247.1, "r_y1": 221.8, "r_x2": 247.1, "r_y2": 213.7, "r_x3": 222.4, "r_y3": 213.7, "coord_origin": "TOPLEFT" }, "text": "OTSL", "orig": "OTSL", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 31, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 264.7, "r_y0": 221.8, "r_x1": 285.7, "r_y1": 221.8, "r_x2": 285.7, "r_y2": 213.7, "r_x3": 264.7, "r_y3": 213.7, "coord_origin": "TOPLEFT" }, "text": "0.955", "orig": "0.955", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 32, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 302.4, "r_y0": 221.8, "r_x1": 323.4, "r_y1": 221.8, "r_x2": 323.4, "r_y2": 213.7, "r_x3": 302.4, "r_y3": 213.7, "coord_origin": "TOPLEFT" }, "text": "0.961", "orig": "0.961", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 33, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 337.8, "r_y0": 221.5, "r_x1": 362.0, "r_y1": 221.5, "r_x2": 362.0, "r_y2": 213.6, "r_x3": 337.8, "r_y3": 213.6, "coord_origin": "TOPLEFT" }, "text": "0.959", "orig": "0.959", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 34, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 380.5, "r_y0": 221.5, "r_x1": 404.6, "r_y1": 221.5, "r_x2": 404.6, "r_y2": 213.6, "r_x3": 380.5, "r_y3": 213.6, "coord_origin": "TOPLEFT" }, "text": "0.862", "orig": "0.862", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 35, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 435.5, "r_y0": 221.5, "r_x1": 454.4, "r_y1": 221.5, "r_x2": 454.4, "r_y2": 213.6, "r_x3": 435.5, "r_y3": 213.6, "coord_origin": "TOPLEFT" }, "text": "1.85", "orig": "1.85", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 36, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 220.9, "r_y0": 234.7, "r_x1": 248.7, "r_y1": 234.7, "r_x2": 248.7, "r_y2": 226.6, "r_x3": 220.9, "r_y3": 226.6, "coord_origin": "TOPLEFT" }, "text": "HTML", "orig": "HTML", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 37, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 264.7, "r_y0": 234.7, "r_x1": 285.7, "r_y1": 234.7, "r_x2": 285.7, "r_y2": 226.6, "r_x3": 264.7, "r_y3": 226.6, "coord_origin": "TOPLEFT" }, "text": "0.917", "orig": "0.917", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 38, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 302.4, "r_y0": 234.7, "r_x1": 323.4, "r_y1": 234.7, "r_x2": 323.4, "r_y2": 226.6, "r_x3": 302.4, "r_y3": 226.6, "coord_origin": "TOPLEFT" }, "text": "0.922", "orig": "0.922", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 39, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 341.7, "r_y0": 234.7, "r_x1": 358.1, "r_y1": 234.7, "r_x2": 358.1, "r_y2": 226.6, "r_x3": 341.7, "r_y3": 226.6, "coord_origin": "TOPLEFT" }, "text": "0.92", "orig": "0.92", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 40, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 382.1, "r_y0": 234.7, "r_x1": 403.0, "r_y1": 234.7, "r_x2": 403.0, "r_y2": 226.6, "r_x3": 382.1, "r_y3": 226.6, "coord_origin": "TOPLEFT" }, "text": "0.722", "orig": "0.722", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 41, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 436.7, "r_y0": 234.7, "r_x1": 453.1, "r_y1": 234.7, "r_x2": 453.1, "r_y2": 226.6, "r_x3": 436.7, "r_y3": 226.6, "coord_origin": "TOPLEFT" }, "text": "3.26", "orig": "3.26", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 42, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 148.6, "r_y0": 253.5, "r_x1": 207.2, "r_y1": 253.5, "r_x2": 207.2, "r_y2": 245.5, "r_x3": 148.6, "r_y3": 245.5, "coord_origin": "TOPLEFT" }, "text": "PubTables-1M", "orig": "PubTables-1M", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 43, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 222.4, "r_y0": 248.1, "r_x1": 247.1, "r_y1": 248.1, "r_x2": 247.1, "r_y2": 240.0, "r_x3": 222.4, "r_y3": 240.0, "coord_origin": "TOPLEFT" }, "text": "OTSL", "orig": "OTSL", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 44, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 264.7, "r_y0": 248.1, "r_x1": 285.7, "r_y1": 248.1, "r_x2": 285.7, "r_y2": 240.0, "r_x3": 264.7, "r_y3": 240.0, "coord_origin": "TOPLEFT" }, "text": "0.987", "orig": "0.987", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 45, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 302.4, "r_y0": 248.1, "r_x1": 323.4, "r_y1": 248.1, "r_x2": 323.4, "r_y2": 240.0, "r_x3": 302.4, "r_y3": 240.0, "coord_origin": "TOPLEFT" }, "text": "0.964", "orig": "0.964", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 46, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 337.8, "r_y0": 247.8, "r_x1": 362.0, "r_y1": 247.8, "r_x2": 362.0, "r_y2": 239.9, "r_x3": 337.8, "r_y3": 239.9, "coord_origin": "TOPLEFT" }, "text": "0.977", "orig": "0.977", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 47, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 380.5, "r_y0": 247.8, "r_x1": 404.6, "r_y1": 247.8, "r_x2": 404.6, "r_y2": 239.9, "r_x3": 380.5, "r_y3": 239.9, "coord_origin": "TOPLEFT" }, "text": "0.896", "orig": "0.896", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 48, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 435.5, "r_y0": 247.8, "r_x1": 454.4, "r_y1": 247.8, "r_x2": 454.4, "r_y2": 239.9, "r_x3": 435.5, "r_y3": 239.9, "coord_origin": "TOPLEFT" }, "text": "1.79", "orig": "1.79", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 49, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 220.9, "r_y0": 261.0, "r_x1": 248.7, "r_y1": 261.0, "r_x2": 248.7, "r_y2": 252.9, "r_x3": 220.9, "r_y3": 252.9, "coord_origin": "TOPLEFT" }, "text": "HTML", "orig": "HTML", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 50, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 264.7, "r_y0": 261.0, "r_x1": 285.7, "r_y1": 261.0, "r_x2": 285.7, "r_y2": 252.9, "r_x3": 264.7, "r_y3": 252.9, "coord_origin": "TOPLEFT" }, "text": "0.983", "orig": "0.983", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 51, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 302.4, "r_y0": 261.0, "r_x1": 323.4, "r_y1": 261.0, "r_x2": 323.4, "r_y2": 252.9, "r_x3": 302.4, "r_y3": 252.9, "coord_origin": "TOPLEFT" }, "text": "0.944", "orig": "0.944", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 52, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 339.4, "r_y0": 261.0, "r_x1": 360.4, "r_y1": 261.0, "r_x2": 360.4, "r_y2": 252.9, "r_x3": 339.4, "r_y3": 252.9, "coord_origin": "TOPLEFT" }, "text": "0.966", "orig": "0.966", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 53, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 382.1, "r_y0": 261.0, "r_x1": 403.0, "r_y1": 261.0, "r_x2": 403.0, "r_y2": 252.9, "r_x3": 382.1, "r_y3": 252.9, "coord_origin": "TOPLEFT" }, "text": "0.889", "orig": "0.889", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 54, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 436.7, "r_y0": 261.0, "r_x1": 453.1, "r_y1": 261.0, "r_x2": 453.1, "r_y2": 252.9, "r_x3": 436.7, "r_y3": 252.9, "coord_origin": "TOPLEFT" }, "text": "3.26", "orig": "3.26", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 55, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 134.8, "r_y0": 297.7, "r_x1": 149.4, "r_y1": 297.7, "r_x2": 149.4, "r_y2": 288.9, "r_x3": 134.8, "r_y3": 288.9, "coord_origin": "TOPLEFT" }, "text": "5.3", "orig": "5.3", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 56, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 160.9, "r_y0": 297.7, "r_x1": 257.1, "r_y1": 297.7, "r_x2": 257.1, "r_y2": 288.9, "r_x3": 160.9, "r_y3": 288.9, "coord_origin": "TOPLEFT" }, "text": "Qualitative Results", "orig": "Qualitative Results", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 57, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 134.8, "r_y0": 318.7, "r_x1": 480.6, "r_y1": 318.7, "r_x2": 480.6, "r_y2": 309.9, "r_x3": 134.8, "r_y3": 309.9, "coord_origin": "TOPLEFT" }, "text": "To illustrate the qualitative differences between OTSL and HTML, Figure 5", "orig": "To illustrate the qualitative differences between OTSL and HTML, Figure 5", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 58, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 134.8, "r_y0": 330.6, "r_x1": 480.6, "r_y1": 330.6, "r_x2": 480.6, "r_y2": 321.8, "r_x3": 134.8, "r_y3": 321.8, "coord_origin": "TOPLEFT" }, "text": "demonstrates less overlap and more accurate bounding boxes with OTSL. In", "orig": "demonstrates less overlap and more accurate bounding boxes with OTSL. In", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 59, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 134.8, "r_y0": 342.6, "r_x1": 480.6, "r_y1": 342.6, "r_x2": 480.6, "r_y2": 333.8, "r_x3": 134.8, "r_y3": 333.8, "coord_origin": "TOPLEFT" }, "text": "Figure 6, OTSL proves to be more effective in handling tables with longer to-", "orig": "Figure 6, OTSL proves to be more effective in handling tables with longer to-", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 60, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 134.8, "r_y0": 354.5, "r_x1": 480.6, "r_y1": 354.5, "r_x2": 480.6, "r_y2": 345.7, "r_x3": 134.8, "r_y3": 345.7, "coord_origin": "TOPLEFT" }, "text": "ken sequences, resulting in even more precise structure prediction and bounding", "orig": "ken sequences, resulting in even more precise structure prediction and bounding", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 61, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 134.8, "r_y0": 366.5, "r_x1": 161.7, "r_y1": 366.5, "r_x2": 161.7, "r_y2": 357.7, "r_x3": 134.8, "r_y3": 357.7, "coord_origin": "TOPLEFT" }, "text": "boxes.", "orig": "boxes.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 62, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 134.8, "r_y0": 405.5, "r_x1": 162.6, "r_y1": 405.5, "r_x2": 162.6, "r_y2": 397.6, "r_x3": 134.8, "r_y3": 397.6, "coord_origin": "TOPLEFT" }, "text": "Fig. 5.", "orig": "Fig. 5.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 63, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 167.4, "r_y0": 405.7, "r_x1": 480.6, "r_y1": 405.7, "r_x2": 480.6, "r_y2": 397.7, "r_x3": 167.4, "r_y3": 397.7, "coord_origin": "TOPLEFT" }, "text": "The OTSL model produces more accurate bounding boxes with less over-", "orig": "The OTSL model produces more accurate bounding boxes with less over-", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 64, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 134.8, "r_y0": 416.7, "r_x1": 480.6, "r_y1": 416.7, "r_x2": 480.6, "r_y2": 408.6, "r_x3": 134.8, "r_y3": 408.6, "coord_origin": "TOPLEFT" }, "text": "lap (E) than the HTML model (D), when predicting the structure of a sparse ta-", "orig": "lap (E) than the HTML model (D), when predicting the structure of a sparse ta-", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 65, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 134.8, "r_y0": 427.6, "r_x1": 480.6, "r_y1": 427.6, "r_x2": 480.6, "r_y2": 419.6, "r_x3": 134.8, "r_y3": 419.6, "coord_origin": "TOPLEFT" }, "text": "ble (A), at twice the inference speed because of shorter sequence length (B),(C).", "orig": "ble (A), at twice the inference speed because of shorter sequence length (B),(C).", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 66, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 134.8, "r_y0": 438.6, "r_x1": 304.7, "r_y1": 438.6, "r_x2": 304.7, "r_y2": 430.5, "r_x3": 134.8, "r_y3": 430.5, "coord_origin": "TOPLEFT" }, "text": "\"PMC2807444_006_00.png\" PubTabNet.", "orig": "\"PMC2807444_006_00.png\" PubTabNet.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 67, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 180.1, "r_y0": 518.9, "r_x1": 190.6, "r_y1": 518.9, "r_x2": 190.6, "r_y2": 516.2, "r_x3": 180.1, "r_y3": 516.2, "coord_origin": "TOPLEFT" }, "text": "", "orig": "
", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 68, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 183.2, "r_y0": 522.8, "r_x1": 304.5, "r_y1": 522.8, "r_x2": 304.5, "r_y2": 520.1, "r_x3": 183.2, "r_y3": 520.1, "coord_origin": "TOPLEFT" }, "text": "", "orig": "", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 69, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 183.2, "r_y0": 526.7, "r_x1": 388.4, "r_y1": 526.7, "r_x2": 388.4, "r_y2": 524.0, "r_x3": 183.2, "r_y3": 524.0, "coord_origin": "TOPLEFT" }, "text": "", "orig": "", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 70, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 183.2, "r_y0": 530.6, "r_x1": 388.4, "r_y1": 530.6, "r_x2": 388.4, "r_y2": 527.9, "r_x3": 183.2, "r_y3": 527.9, "coord_origin": "TOPLEFT" }, "text": "", "orig": "", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 71, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 183.2, "r_y0": 534.5, "r_x1": 388.4, "r_y1": 534.5, "r_x2": 388.4, "r_y2": 531.8, "r_x3": 183.2, "r_y3": 531.8, "coord_origin": "TOPLEFT" }, "text": "", "orig": "", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 72, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 183.2, "r_y0": 538.4, "r_x1": 388.4, "r_y1": 538.4, "r_x2": 388.4, "r_y2": 535.7, "r_x3": 183.2, "r_y3": 535.7, "coord_origin": "TOPLEFT" }, "text": "", "orig": "", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 73, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 183.2, "r_y0": 542.3, "r_x1": 388.4, "r_y1": 542.3, "r_x2": 388.4, "r_y2": 539.6, "r_x3": 183.2, "r_y3": 539.6, "coord_origin": "TOPLEFT" }, "text": "", "orig": "", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 74, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 183.2, "r_y0": 546.2, "r_x1": 388.4, "r_y1": 546.2, "r_x2": 388.4, "r_y2": 543.5, "r_x3": 183.2, "r_y3": 543.5, "coord_origin": "TOPLEFT" }, "text": "", "orig": "", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 75, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 183.2, "r_y0": 550.1, "r_x1": 388.4, "r_y1": 550.1, "r_x2": 388.4, "r_y2": 547.4, "r_x3": 183.2, "r_y3": 547.4, "coord_origin": "TOPLEFT" }, "text": "", "orig": "", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 76, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 183.2, "r_y0": 554.0, "r_x1": 388.4, "r_y1": 554.0, "r_x2": 388.4, "r_y2": 551.3, "r_x3": 183.2, "r_y3": 551.3, "coord_origin": "TOPLEFT" }, "text": "", "orig": "", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 77, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 180.1, "r_y0": 557.9, "r_x1": 191.9, "r_y1": 557.9, "r_x2": 191.9, "r_y2": 555.2, "r_x3": 180.1, "r_y3": 555.2, "coord_origin": "TOPLEFT" }, "text": "
", "orig": "", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 78, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 407.4, "r_y0": 521.0, "r_x1": 408.8, "r_y1": 521.0, "r_x2": 408.8, "r_y2": 518.3, "r_x3": 407.4, "r_y3": 518.3, "coord_origin": "TOPLEFT" }, "text": "C", "orig": "C", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 79, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 410.3, "r_y0": 521.0, "r_x1": 450.5, "r_y1": 521.0, "r_x2": 450.5, "r_y2": 518.3, "r_x3": 410.3, "r_y3": 518.3, "coord_origin": "TOPLEFT" }, "text": "C L L L C L L L L L C L L NL", "orig": "C L L L C L L L L L C L L NL", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 80, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 407.4, "r_y0": 524.9, "r_x1": 408.8, "r_y1": 524.9, "r_x2": 408.8, "r_y2": 522.2, "r_x3": 407.4, "r_y3": 522.2, "coord_origin": "TOPLEFT" }, "text": "C", "orig": "C", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 81, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 410.3, "r_y0": 524.9, "r_x1": 450.5, "r_y1": 524.9, "r_x2": 450.5, "r_y2": 522.2, "r_x3": 410.3, "r_y3": 522.2, "coord_origin": "TOPLEFT" }, "text": "C C C C C C C C C C C C C NL", "orig": "C C C C C C C C C C C C C NL", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 82, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 407.4, "r_y0": 528.8, "r_x1": 408.8, "r_y1": 528.8, "r_x2": 408.8, "r_y2": 526.1, "r_x3": 407.4, "r_y3": 526.1, "coord_origin": "TOPLEFT" }, "text": "C", "orig": "C", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 83, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 410.3, "r_y0": 528.8, "r_x1": 450.5, "r_y1": 528.8, "r_x2": 450.5, "r_y2": 526.1, "r_x3": 410.3, "r_y3": 526.1, "coord_origin": "TOPLEFT" }, "text": "C C C C C C C C C C C C C NL", "orig": "C C C C C C C C C C C C C NL", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 84, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 407.4, "r_y0": 532.7, "r_x1": 408.8, "r_y1": 532.7, "r_x2": 408.8, "r_y2": 530.0, "r_x3": 407.4, "r_y3": 530.0, "coord_origin": "TOPLEFT" }, "text": "C", "orig": "C", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 85, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 410.3, "r_y0": 532.7, "r_x1": 450.5, "r_y1": 532.7, "r_x2": 450.5, "r_y2": 530.0, "r_x3": 410.3, "r_y3": 530.0, "coord_origin": "TOPLEFT" }, "text": "C C C C C C C C C C C C C NL", "orig": "C C C C C C C C C C C C C NL", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 86, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 407.4, "r_y0": 536.6, "r_x1": 408.8, "r_y1": 536.6, "r_x2": 408.8, "r_y2": 533.9, "r_x3": 407.4, "r_y3": 533.9, "coord_origin": "TOPLEFT" }, "text": "C", "orig": "C", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 87, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 410.3, "r_y0": 536.6, "r_x1": 450.5, "r_y1": 536.6, "r_x2": 450.5, "r_y2": 533.9, "r_x3": 410.3, "r_y3": 533.9, "coord_origin": "TOPLEFT" }, "text": "C C C C C C C C C C C C C NL", "orig": "C C C C C C C C C C C C C NL", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 88, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 407.4, "r_y0": 540.5, "r_x1": 408.8, "r_y1": 540.5, "r_x2": 408.8, "r_y2": 537.8, "r_x3": 407.4, "r_y3": 537.8, "coord_origin": "TOPLEFT" }, "text": "C", "orig": "C", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 89, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 410.3, "r_y0": 540.5, "r_x1": 450.5, "r_y1": 540.5, "r_x2": 450.5, "r_y2": 537.8, "r_x3": 410.3, "r_y3": 537.8, "coord_origin": "TOPLEFT" }, "text": "C C C C C C C C C C C C C NL", "orig": "C C C C C C C C C C C C C NL", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 90, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 407.4, "r_y0": 544.4, "r_x1": 408.8, "r_y1": 544.4, "r_x2": 408.8, "r_y2": 541.7, "r_x3": 407.4, "r_y3": 541.7, "coord_origin": "TOPLEFT" }, "text": "C", "orig": "C", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 91, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 410.3, "r_y0": 544.4, "r_x1": 450.5, "r_y1": 544.4, "r_x2": 450.5, "r_y2": 541.7, "r_x3": 410.3, "r_y3": 541.7, "coord_origin": "TOPLEFT" }, "text": "C C C C C C C C C C C C C NL", "orig": "C C C C C C C C C C C C C NL", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 92, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 407.4, "r_y0": 548.3, "r_x1": 408.8, "r_y1": 548.3, "r_x2": 408.8, "r_y2": 545.6, "r_x3": 407.4, "r_y3": 545.6, "coord_origin": "TOPLEFT" }, "text": "C", "orig": "C", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 93, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 410.3, "r_y0": 548.3, "r_x1": 450.5, "r_y1": 548.3, "r_x2": 450.5, "r_y2": 545.6, "r_x3": 410.3, "r_y3": 545.6, "coord_origin": "TOPLEFT" }, "text": "C C C C C C C C C C C C C NL", "orig": "C C C C C C C C C C C C C NL", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 94, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 407.4, "r_y0": 552.2, "r_x1": 408.8, "r_y1": 552.2, "r_x2": 408.8, "r_y2": 549.5, "r_x3": 407.4, "r_y3": 549.5, "coord_origin": "TOPLEFT" }, "text": "C", "orig": "C", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 95, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 410.3, "r_y0": 552.2, "r_x1": 450.5, "r_y1": 552.2, "r_x2": 450.5, "r_y2": 549.5, "r_x3": 410.3, "r_y3": 549.5, "coord_origin": "TOPLEFT" }, "text": "C C C C C C C C C C C C C NL", "orig": "C C C C C C C C C C C C C NL", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 96, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 164.5, "r_y0": 515.3, "r_x1": 181.9, "r_y1": 515.3, "r_x2": 181.9, "r_y2": 509.5, "r_x3": 164.5, "r_y3": 509.5, "coord_origin": "TOPLEFT" }, "text": "HTML", "orig": "HTML", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 97, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 183.6, "r_y0": 515.3, "r_x1": 186.4, "r_y1": 515.3, "r_x2": 186.4, "r_y2": 509.5, "r_x3": 183.6, "r_y3": 509.5, "coord_origin": "TOPLEFT" }, "text": "#", "orig": "#", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 98, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 189.2, "r_y0": 515.3, "r_x1": 208.9, "r_y1": 515.3, "r_x2": 208.9, "r_y2": 509.5, "r_x3": 189.2, "r_y3": 509.5, "coord_origin": "TOPLEFT" }, "text": "tokens:", "orig": "tokens:", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 99, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 210.6, "r_y0": 515.3, "r_x1": 221.0, "r_y1": 515.3, "r_x2": 221.0, "r_y2": 509.5, "r_x3": 210.6, "r_y3": 509.5, "coord_origin": "TOPLEFT" }, "text": "258", "orig": "258", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 100, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 390.2, "r_y0": 515.5, "r_x1": 406.8, "r_y1": 515.5, "r_x2": 406.8, "r_y2": 509.6, "r_x3": 390.2, "r_y3": 509.6, "coord_origin": "TOPLEFT" }, "text": "OTSL", "orig": "OTSL", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 101, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 408.6, "r_y0": 515.5, "r_x1": 411.4, "r_y1": 515.5, "r_x2": 411.4, "r_y2": 509.6, "r_x3": 408.6, "r_y3": 509.6, "coord_origin": "TOPLEFT" }, "text": "#", "orig": "#", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 102, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 414.2, "r_y0": 515.5, "r_x1": 433.9, "r_y1": 515.5, "r_x2": 433.9, "r_y2": 509.6, "r_x3": 414.2, "r_y3": 509.6, "coord_origin": "TOPLEFT" }, "text": "tokens:", "orig": "tokens:", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 103, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 435.6, "r_y0": 515.5, "r_x1": 446.0, "r_y1": 515.5, "r_x2": 446.0, "r_y2": 509.6, "r_x3": 435.6, "r_y3": 509.6, "coord_origin": "TOPLEFT" }, "text": "135", "orig": "135", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 104, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 167.2, "r_y0": 526.4, "r_x1": 172.8, "r_y1": 526.4, "r_x2": 172.8, "r_y2": 519.1, "r_x3": 167.2, "r_y3": 519.1, "coord_origin": "TOPLEFT" }, "text": "B", "orig": "B", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 105, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 187.3, "r_y0": 455.9, "r_x1": 193.0, "r_y1": 455.9, "r_x2": 193.0, "r_y2": 448.6, "r_x3": 187.3, "r_y3": 448.6, "coord_origin": "TOPLEFT" }, "text": "A", "orig": "A", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 106, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 167.4, "r_y0": 573.3, "r_x1": 173.0, "r_y1": 573.3, "r_x2": 173.0, "r_y2": 566.0, "r_x3": 167.4, "r_y3": 566.0, "coord_origin": "TOPLEFT" }, "text": "D", "orig": "D", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 107, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 248.5, "r_y0": 629.1, "r_x1": 253.7, "r_y1": 629.1, "r_x2": 253.7, "r_y2": 621.8, "r_x3": 248.5, "r_y3": 621.8, "coord_origin": "TOPLEFT" }, "text": "E", "orig": "E", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 108, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 395.9, "r_y0": 526.5, "r_x1": 401.5, "r_y1": 526.5, "r_x2": 401.5, "r_y2": 519.2, "r_x3": 395.9, "r_y3": 519.2, "coord_origin": "TOPLEFT" }, "text": "C", "orig": "C", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 109, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 171.6, "r_y0": 597.3, "r_x1": 177.5, "r_y1": 597.3, "r_x2": 177.5, "r_y2": 580.3, "r_x3": 171.6, "r_y3": 580.3, "coord_origin": "TOPLEFT" }, "text": "HTML", "orig": "HTML", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 110, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 251.1, "r_y0": 649.9, "r_x1": 256.9, "r_y1": 649.9, "r_x2": 256.9, "r_y2": 633.6, "r_x3": 251.1, "r_y3": 633.6, "coord_origin": "TOPLEFT" }, "text": "OTSL", "orig": "OTSL", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 111, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 372.1, "r_y0": 607.3, "r_x1": 427.0, "r_y1": 607.3, "r_x2": 427.0, "r_y2": 601.5, "r_x3": 372.1, "r_y3": 601.5, "coord_origin": "TOPLEFT" }, "text": "HTML model shows", "orig": "HTML model shows", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 112, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 372.1, "r_y0": 613.8, "r_x1": 430.1, "r_y1": 613.8, "r_x2": 430.1, "r_y2": 607.9, "r_x3": 372.1, "r_y3": 607.9, "coord_origin": "TOPLEFT" }, "text": "bounding box drifting", "orig": "bounding box drifting", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 113, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 176.9, "r_y0": 648.7, "r_x1": 231.1, "r_y1": 648.7, "r_x2": 231.1, "r_y2": 642.9, "r_x3": 176.9, "r_y3": 642.9, "coord_origin": "TOPLEFT" }, "text": "OTSL model shows", "orig": "OTSL model shows", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 114, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 176.9, "r_y0": 655.2, "r_x1": 231.0, "r_y1": 655.2, "r_x2": 231.0, "r_y2": 649.3, "r_x3": 176.9, "r_y3": 649.3, "coord_origin": "TOPLEFT" }, "text": "clean bounding box", "orig": "clean bounding box", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 115, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 176.9, "r_y0": 661.6, "r_x1": 203.9, "r_y1": 661.6, "r_x2": 203.9, "r_y2": 655.8, "r_x3": 176.9, "r_y3": 655.8, "coord_origin": "TOPLEFT" }, "text": "alignment", "orig": "alignment", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 116, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 215.9, "r_y0": 569.2, "r_x1": 218.5, "r_y1": 569.2, "r_x2": 218.5, "r_y2": 557.6, "r_x3": 215.9, "r_y3": 557.6, "coord_origin": "TOPLEFT" }, "text": "\u2264", "orig": "\u2264", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 117, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 229.1, "r_y0": 569.2, "r_x1": 231.7, "r_y1": 569.2, "r_x2": 231.7, "r_y2": 557.6, "r_x3": 229.1, "r_y3": 557.6, "coord_origin": "TOPLEFT" }, "text": "\u03bc", "orig": "\u03bc", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 118, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 342.6, "r_y0": 439.7, "r_x1": 344.8, "r_y1": 439.7, "r_x2": 344.8, "r_y2": 430.2, "r_x3": 342.6, "r_y3": 430.2, "coord_origin": "TOPLEFT" }, "text": "\u03bc", "orig": "\u03bc", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 119, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 261.2, "r_y0": 451.2, "r_x1": 263.6, "r_y1": 451.2, "r_x2": 263.6, "r_y2": 448.5, "r_x3": 261.2, "r_y3": 448.5, "coord_origin": "TOPLEFT" }, "text": "S", "orig": "S", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 120, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 312.3, "r_y0": 451.2, "r_x1": 313.6, "r_y1": 451.2, "r_x2": 313.6, "r_y2": 448.5, "r_x3": 312.3, "r_y3": 448.5, "coord_origin": "TOPLEFT" }, "text": "I", "orig": "I", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 121, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 377.4, "r_y0": 451.2, "r_x1": 380.1, "r_y1": 451.2, "r_x2": 380.1, "r_y2": 448.5, "r_x3": 377.4, "r_y3": 448.5, "coord_origin": "TOPLEFT" }, "text": "R", "orig": "R", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 122, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 200.6, "r_y0": 456.1, "r_x1": 205.8, "r_y1": 456.1, "r_x2": 205.8, "r_y2": 453.3, "r_x3": 200.6, "r_y3": 453.3, "coord_origin": "TOPLEFT" }, "text": "ST", "orig": "ST", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 123, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 222.2, "r_y0": 456.1, "r_x1": 229.8, "r_y1": 456.1, "r_x2": 229.8, "r_y2": 453.3, "r_x3": 222.2, "r_y3": 453.3, "coord_origin": "TOPLEFT" }, "text": "0.03", "orig": "0.03", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 124, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 243.3, "r_y0": 456.1, "r_x1": 250.8, "r_y1": 456.1, "r_x2": 250.8, "r_y2": 453.3, "r_x3": 243.3, "r_y3": 453.3, "coord_origin": "TOPLEFT" }, "text": "0.06", "orig": "0.06", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 125, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 264.3, "r_y0": 456.1, "r_x1": 271.8, "r_y1": 456.1, "r_x2": 271.8, "r_y2": 453.3, "r_x3": 264.3, "r_y3": 453.3, "coord_origin": "TOPLEFT" }, "text": "0.12", "orig": "0.12", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 126, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 285.3, "r_y0": 456.1, "r_x1": 292.9, "r_y1": 456.1, "r_x2": 292.9, "r_y2": 453.3, "r_x3": 285.3, "r_y3": 453.3, "coord_origin": "TOPLEFT" }, "text": "0.25", "orig": "0.25", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 127, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 306.4, "r_y0": 456.1, "r_x1": 311.8, "r_y1": 456.1, "r_x2": 311.8, "r_y2": 453.3, "r_x3": 306.4, "r_y3": 453.3, "coord_origin": "TOPLEFT" }, "text": "0.5", "orig": "0.5", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 128, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 323.4, "r_y0": 456.1, "r_x1": 325.6, "r_y1": 456.1, "r_x2": 325.6, "r_y2": 453.3, "r_x3": 323.4, "r_y3": 453.3, "coord_origin": "TOPLEFT" }, "text": "1", "orig": "1", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 129, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 334.5, "r_y0": 456.1, "r_x1": 336.6, "r_y1": 456.1, "r_x2": 336.6, "r_y2": 453.3, "r_x3": 334.5, "r_y3": 453.3, "coord_origin": "TOPLEFT" }, "text": "2", "orig": "2", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 130, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 345.5, "r_y0": 456.1, "r_x1": 347.7, "r_y1": 456.1, "r_x2": 347.7, "r_y2": 453.3, "r_x3": 345.5, "r_y3": 453.3, "coord_origin": "TOPLEFT" }, "text": "4", "orig": "4", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 131, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 356.6, "r_y0": 456.1, "r_x1": 358.7, "r_y1": 456.1, "r_x2": 358.7, "r_y2": 453.3, "r_x3": 356.6, "r_y3": 453.3, "coord_origin": "TOPLEFT" }, "text": "8", "orig": "8", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 132, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 367.6, "r_y0": 456.1, "r_x1": 372.0, "r_y1": 456.1, "r_x2": 372.0, "r_y2": 453.3, "r_x3": 367.6, "r_y3": 453.3, "coord_origin": "TOPLEFT" }, "text": "16", "orig": "16", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 133, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 382.7, "r_y0": 456.1, "r_x1": 387.0, "r_y1": 456.1, "r_x2": 387.0, "r_y2": 453.3, "r_x3": 382.7, "r_y3": 453.3, "coord_origin": "TOPLEFT" }, "text": "32", "orig": "32", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 134, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 397.7, "r_y0": 456.1, "r_x1": 402.1, "r_y1": 456.1, "r_x2": 402.1, "r_y2": 453.3, "r_x3": 397.7, "r_y3": 453.3, "coord_origin": "TOPLEFT" }, "text": "64", "orig": "64", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 135, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 412.8, "r_y0": 457.8, "r_x1": 414.9, "r_y1": 457.8, "r_x2": 414.9, "r_y2": 448.0, "r_x3": 412.8, "r_y3": 448.0, "coord_origin": "TOPLEFT" }, "text": "\u2265", "orig": "\u2265", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 136, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 415.0, "r_y0": 456.1, "r_x1": 422.5, "r_y1": 456.1, "r_x2": 422.5, "r_y2": 453.3, "r_x3": 415.0, "r_y3": 453.3, "coord_origin": "TOPLEFT" }, "text": " 128", "orig": " 128", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 137, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 200.6, "r_y0": 466.7, "r_x1": 204.6, "r_y1": 466.7, "r_x2": 204.6, "r_y2": 463.9, "r_x3": 200.6, "r_y3": 463.9, "coord_origin": "TOPLEFT" }, "text": "63", "orig": "63", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 138, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 367.6, "r_y0": 466.7, "r_x1": 369.6, "r_y1": 466.7, "r_x2": 369.6, "r_y2": 463.9, "r_x3": 367.6, "r_y3": 463.9, "coord_origin": "TOPLEFT" }, "text": "1", "orig": "1", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 139, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 382.7, "r_y0": 466.7, "r_x1": 384.6, "r_y1": 466.7, "r_x2": 384.6, "r_y2": 463.9, "r_x3": 382.7, "r_y3": 463.9, "coord_origin": "TOPLEFT" }, "text": "1", "orig": "1", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 140, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 397.7, "r_y0": 466.7, "r_x1": 399.7, "r_y1": 466.7, "r_x2": 399.7, "r_y2": 463.9, "r_x3": 397.7, "r_y3": 463.9, "coord_origin": "TOPLEFT" }, "text": "3", "orig": "3", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 141, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 200.6, "r_y0": 471.5, "r_x1": 206.5, "r_y1": 471.5, "r_x2": 206.5, "r_y2": 468.8, "r_x3": 200.6, "r_y3": 468.8, "coord_origin": "TOPLEFT" }, "text": "199", "orig": "199", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 142, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 264.3, "r_y0": 471.5, "r_x1": 266.3, "r_y1": 471.5, "r_x2": 266.3, "r_y2": 468.8, "r_x3": 264.3, "r_y3": 468.8, "coord_origin": "TOPLEFT" }, "text": "5", "orig": "5", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 143, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 306.4, "r_y0": 471.5, "r_x1": 308.3, "r_y1": 471.5, "r_x2": 308.3, "r_y2": 468.8, "r_x3": 306.4, "r_y3": 468.8, "coord_origin": "TOPLEFT" }, "text": "1", "orig": "1", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 144, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 345.5, "r_y0": 471.5, "r_x1": 347.5, "r_y1": 471.5, "r_x2": 347.5, "r_y2": 468.8, "r_x3": 345.5, "r_y3": 468.8, "coord_origin": "TOPLEFT" }, "text": "2", "orig": "2", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 145, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 356.6, "r_y0": 471.5, "r_x1": 358.5, "r_y1": 471.5, "r_x2": 358.5, "r_y2": 468.8, "r_x3": 356.6, "r_y3": 468.8, "coord_origin": "TOPLEFT" }, "text": "4", "orig": "4", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 146, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 367.6, "r_y0": 471.5, "r_x1": 369.6, "r_y1": 471.5, "r_x2": 369.6, "r_y2": 468.8, "r_x3": 367.6, "r_y3": 468.8, "coord_origin": "TOPLEFT" }, "text": "1", "orig": "1", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 147, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 382.7, "r_y0": 471.5, "r_x1": 384.6, "r_y1": 471.5, "r_x2": 384.6, "r_y2": 468.8, "r_x3": 382.7, "r_y3": 468.8, "coord_origin": "TOPLEFT" }, "text": "1", "orig": "1", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 148, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 200.6, "r_y0": 476.4, "r_x1": 206.5, "r_y1": 476.4, "r_x2": 206.5, "r_y2": 473.7, "r_x3": 200.6, "r_y3": 473.7, "coord_origin": "TOPLEFT" }, "text": "416", "orig": "416", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 149, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 264.3, "r_y0": 476.4, "r_x1": 266.3, "r_y1": 476.4, "r_x2": 266.3, "r_y2": 473.7, "r_x3": 264.3, "r_y3": 473.7, "coord_origin": "TOPLEFT" }, "text": "4", "orig": "4", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 150, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 200.6, "r_y0": 481.3, "r_x1": 206.5, "r_y1": 481.3, "r_x2": 206.5, "r_y2": 478.5, "r_x3": 200.6, "r_y3": 478.5, "coord_origin": "TOPLEFT" }, "text": "230", "orig": "230", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 151, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 243.3, "r_y0": 481.3, "r_x1": 245.2, "r_y1": 481.3, "r_x2": 245.2, "r_y2": 478.5, "r_x3": 243.3, "r_y3": 478.5, "coord_origin": "TOPLEFT" }, "text": "1", "orig": "1", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 152, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 264.3, "r_y0": 481.3, "r_x1": 266.3, "r_y1": 481.3, "r_x2": 266.3, "r_y2": 478.5, "r_x3": 264.3, "r_y3": 478.5, "coord_origin": "TOPLEFT" }, "text": "9", "orig": "9", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 153, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 323.4, "r_y0": 481.3, "r_x1": 325.4, "r_y1": 481.3, "r_x2": 325.4, "r_y2": 478.5, "r_x3": 323.4, "r_y3": 478.5, "coord_origin": "TOPLEFT" }, "text": "1", "orig": "1", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 154, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 397.7, "r_y0": 481.3, "r_x1": 399.7, "r_y1": 481.3, "r_x2": 399.7, "r_y2": 478.5, "r_x3": 397.7, "r_y3": 478.5, "coord_origin": "TOPLEFT" }, "text": "1", "orig": "1", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 155, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 200.6, "r_y0": 486.1, "r_x1": 206.5, "r_y1": 486.1, "r_x2": 206.5, "r_y2": 483.4, "r_x3": 200.6, "r_y3": 483.4, "coord_origin": "TOPLEFT" }, "text": "276", "orig": "276", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 156, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 382.7, "r_y0": 486.1, "r_x1": 384.6, "r_y1": 486.1, "r_x2": 384.6, "r_y2": 483.4, "r_x3": 382.7, "r_y3": 483.4, "coord_origin": "TOPLEFT" }, "text": "2", "orig": "2", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 157, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 397.7, "r_y0": 486.1, "r_x1": 401.6, "r_y1": 486.1, "r_x2": 401.6, "r_y2": 483.4, "r_x3": 397.7, "r_y3": 483.4, "coord_origin": "TOPLEFT" }, "text": "12", "orig": "12", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 158, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 412.8, "r_y0": 486.1, "r_x1": 414.7, "r_y1": 486.1, "r_x2": 414.7, "r_y2": 483.4, "r_x3": 412.8, "r_y3": 483.4, "coord_origin": "TOPLEFT" }, "text": "1", "orig": "1", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 159, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 200.6, "r_y0": 491.0, "r_x1": 207.1, "r_y1": 491.0, "r_x2": 207.1, "r_y2": 488.3, "r_x3": 200.6, "r_y3": 488.3, "coord_origin": "TOPLEFT" }, "text": "320", "orig": "320", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 160, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 367.6, "r_y0": 491.0, "r_x1": 369.8, "r_y1": 491.0, "r_x2": 369.8, "r_y2": 488.3, "r_x3": 367.6, "r_y3": 488.3, "coord_origin": "TOPLEFT" }, "text": "1", "orig": "1", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 161, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 382.7, "r_y0": 491.0, "r_x1": 384.8, "r_y1": 491.0, "r_x2": 384.8, "r_y2": 488.3, "r_x3": 382.7, "r_y3": 488.3, "coord_origin": "TOPLEFT" }, "text": "4", "orig": "4", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 162, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 397.7, "r_y0": 491.0, "r_x1": 402.1, "r_y1": 491.0, "r_x2": 402.1, "r_y2": 488.3, "r_x3": 397.7, "r_y3": 488.3, "coord_origin": "TOPLEFT" }, "text": "20", "orig": "20", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 163, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 200.6, "r_y0": 495.9, "r_x1": 208.5, "r_y1": 495.9, "r_x2": 208.5, "r_y2": 493.2, "r_x3": 200.6, "r_y3": 493.2, "coord_origin": "TOPLEFT" }, "text": "2013", "orig": "2013", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 164, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 264.3, "r_y0": 495.9, "r_x1": 266.3, "r_y1": 495.9, "r_x2": 266.3, "r_y2": 493.2, "r_x3": 264.3, "r_y3": 493.2, "coord_origin": "TOPLEFT" }, "text": "3", "orig": "3", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 165, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 227.9, "r_y0": 675.3, "r_x1": 230.1, "r_y1": 675.3, "r_x2": 230.1, "r_y2": 665.8, "r_x3": 227.9, "r_y3": 665.8, "coord_origin": "TOPLEFT" }, "text": "\u03bc", "orig": "\u03bc", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 166, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 300.6, "r_y0": 693.4, "r_x1": 302.7, "r_y1": 693.4, "r_x2": 302.7, "r_y2": 683.6, "r_x3": 300.6, "r_y3": 683.6, "coord_origin": "TOPLEFT" }, "text": "\u2265", "orig": "\u2265", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "has_chars": false, "has_words": false, "has_lines": true, "image": null, "lines": [] }, "predictions": { "layout": { "clusters": [ { "id": 7, "label": "page_header", "bbox": { "l": 134.8, "t": 93.8, "r": 144.0, "b": 101.8, "coord_origin": "TOPLEFT" }, "confidence": 0.83, "cells": [ { "index": 0, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 134.8, "r_y0": 101.8, "r_x1": 144.0, "r_y1": 101.8, "r_x2": 144.0, "r_y2": 93.8, "r_x3": 134.8, "r_y3": 93.8, "coord_origin": "TOPLEFT" }, "text": "10", "orig": "10", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 6, "label": "page_header", "bbox": { "l": 167.8, "t": 93.8, "r": 231.7, "b": 101.8, "coord_origin": "TOPLEFT" }, "confidence": 0.84, "cells": [ { "index": 1, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 167.8, "r_y0": 101.8, "r_x1": 178.1, "r_y1": 101.8, "r_x2": 178.1, "r_y2": 93.8, "r_x3": 167.8, "r_y3": 93.8, "coord_origin": "TOPLEFT" }, "text": "M.", "orig": "M.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 2, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 182.4, "r_y0": 101.8, "r_x1": 231.7, "r_y1": 101.8, "r_x2": 231.7, "r_y2": 93.8, "r_x3": 182.4, "r_y3": 93.8, "coord_origin": "TOPLEFT" }, "text": "Lysak, et al.", "orig": "Lysak, et al.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 4, "label": "caption", "bbox": { "l": 134.8, "t": 115.8, "r": 480.6, "b": 145.9, "coord_origin": "TOPLEFT" }, "confidence": 0.95, "cells": [ { "index": 3, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 134.8, "r_y0": 123.8, "r_x1": 173.1, "r_y1": 123.8, "r_x2": 173.1, "r_y2": 115.8, "r_x3": 134.8, "r_y3": 115.8, "coord_origin": "TOPLEFT" }, "text": "Table 2.", "orig": "Table 2.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 4, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 181.3, "r_y0": 124.0, "r_x1": 480.6, "r_y1": 124.0, "r_x2": 480.6, "r_y2": 115.9, "r_x3": 181.3, "r_y3": 115.9, "coord_origin": "TOPLEFT" }, "text": "TSR and cell detection results compared between OTSL and HTML on", "orig": "TSR and cell detection results compared between OTSL and HTML on", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 5, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 134.8, "r_y0": 134.9, "r_x1": 480.6, "r_y1": 134.9, "r_x2": 480.6, "r_y2": 126.9, "r_x3": 134.8, "r_y3": 126.9, "coord_origin": "TOPLEFT" }, "text": "the PubTabNet [22], FinTabNet [21] and PubTables-1M [14] data sets using Table-", "orig": "the PubTabNet [22], FinTabNet [21] and PubTables-1M [14] data sets using Table-", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 6, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 134.8, "r_y0": 145.9, "r_x1": 306.0, "r_y1": 145.9, "r_x2": 306.0, "r_y2": 137.8, "r_x3": 134.8, "r_y3": 137.8, "coord_origin": "TOPLEFT" }, "text": "Former [9] (with enc=6, dec=6, heads=8).", "orig": "Former [9] (with enc=6, dec=6, heads=8).", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 0, "label": "table", "bbox": { "l": 143.6, "t": 156.3, "r": 470.8, "b": 263.3, "coord_origin": "TOPLEFT" }, "confidence": 0.99, "cells": [ { "index": 7, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 160.8, "r_y0": 174.6, "r_x1": 195.0, "r_y1": 174.6, "r_x2": 195.0, "r_y2": 166.6, "r_x3": 160.8, "r_y3": 166.6, "coord_origin": "TOPLEFT" }, "text": "Data set", "orig": "Data set", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 8, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 215.5, "r_y0": 174.6, "r_x1": 254.0, "r_y1": 174.6, "r_x2": 254.0, "r_y2": 166.5, "r_x3": 215.5, "r_y3": 166.5, "coord_origin": "TOPLEFT" }, "text": "Language", "orig": "Language", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 9, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 300.4, "r_y0": 169.1, "r_x1": 324.0, "r_y1": 169.1, "r_x2": 324.0, "r_y2": 161.1, "r_x3": 300.4, "r_y3": 161.1, "coord_origin": "TOPLEFT" }, "text": "TEDs", "orig": "TEDs", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 10, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 370.3, "r_y0": 174.6, "r_x1": 414.7, "r_y1": 174.6, "r_x2": 414.7, "r_y2": 166.6, "r_x3": 370.3, "r_y3": 166.6, "coord_origin": "TOPLEFT" }, "text": "mAP(0.75)", "orig": "mAP(0.75)", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 11, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 426.7, "r_y0": 169.1, "r_x1": 463.1, "r_y1": 169.1, "r_x2": 463.1, "r_y2": 161.1, "r_x3": 426.7, "r_y3": 161.1, "coord_origin": "TOPLEFT" }, "text": "Inference", "orig": "Inference", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 12, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 423.1, "r_y0": 180.1, "r_x1": 466.7, "r_y1": 180.1, "r_x2": 466.7, "r_y2": 172.0, "r_x3": 423.1, "r_y3": 172.0, "coord_origin": "TOPLEFT" }, "text": "time (secs)", "orig": "time (secs)", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 13, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 262.4, "r_y0": 182.1, "r_x1": 288.1, "r_y1": 182.1, "r_x2": 288.1, "r_y2": 174.0, "r_x3": 262.4, "r_y3": 174.0, "coord_origin": "TOPLEFT" }, "text": "simple", "orig": "simple", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 14, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 296.4, "r_y0": 182.1, "r_x1": 329.4, "r_y1": 182.1, "r_x2": 329.4, "r_y2": 174.0, "r_x3": 296.4, "r_y3": 174.0, "coord_origin": "TOPLEFT" }, "text": "complex", "orig": "complex", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 15, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 345.0, "r_y0": 182.1, "r_x1": 354.8, "r_y1": 182.1, "r_x2": 354.8, "r_y2": 174.0, "r_x3": 345.0, "r_y3": 174.0, "coord_origin": "TOPLEFT" }, "text": "all", "orig": "all", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 16, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 154.5, "r_y0": 200.9, "r_x1": 201.2, "r_y1": 200.9, "r_x2": 201.2, "r_y2": 192.9, "r_x3": 154.5, "r_y3": 192.9, "coord_origin": "TOPLEFT" }, "text": "PubTabNet", "orig": "PubTabNet", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 17, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 222.4, "r_y0": 195.5, "r_x1": 247.1, "r_y1": 195.5, "r_x2": 247.1, "r_y2": 187.4, "r_x3": 222.4, "r_y3": 187.4, "coord_origin": "TOPLEFT" }, "text": "OTSL", "orig": "OTSL", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 18, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 264.7, "r_y0": 195.5, "r_x1": 285.7, "r_y1": 195.5, "r_x2": 285.7, "r_y2": 187.4, "r_x3": 264.7, "r_y3": 187.4, "coord_origin": "TOPLEFT" }, "text": "0.965", "orig": "0.965", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 19, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 302.4, "r_y0": 195.5, "r_x1": 323.4, "r_y1": 195.5, "r_x2": 323.4, "r_y2": 187.4, "r_x3": 302.4, "r_y3": 187.4, "coord_origin": "TOPLEFT" }, "text": "0.934", "orig": "0.934", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 20, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 339.4, "r_y0": 195.5, "r_x1": 360.4, "r_y1": 195.5, "r_x2": 360.4, "r_y2": 187.4, "r_x3": 339.4, "r_y3": 187.4, "coord_origin": "TOPLEFT" }, "text": "0.955", "orig": "0.955", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 21, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 383.1, "r_y0": 195.2, "r_x1": 402.0, "r_y1": 195.2, "r_x2": 402.0, "r_y2": 187.3, "r_x3": 383.1, "r_y3": 187.3, "coord_origin": "TOPLEFT" }, "text": "0.88", "orig": "0.88", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 22, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 435.5, "r_y0": 195.2, "r_x1": 454.4, "r_y1": 195.2, "r_x2": 454.4, "r_y2": 187.3, "r_x3": 435.5, "r_y3": 187.3, "coord_origin": "TOPLEFT" }, "text": "2.73", "orig": "2.73", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 23, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 220.9, "r_y0": 208.4, "r_x1": 248.7, "r_y1": 208.4, "r_x2": 248.7, "r_y2": 200.3, "r_x3": 220.9, "r_y3": 200.3, "coord_origin": "TOPLEFT" }, "text": "HTML", "orig": "HTML", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 24, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 264.7, "r_y0": 208.4, "r_x1": 285.7, "r_y1": 208.4, "r_x2": 285.7, "r_y2": 200.3, "r_x3": 264.7, "r_y3": 200.3, "coord_origin": "TOPLEFT" }, "text": "0.969", "orig": "0.969", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 25, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 302.4, "r_y0": 208.4, "r_x1": 323.4, "r_y1": 208.4, "r_x2": 323.4, "r_y2": 200.3, "r_x3": 302.4, "r_y3": 200.3, "coord_origin": "TOPLEFT" }, "text": "0.927", "orig": "0.927", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 26, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 339.4, "r_y0": 208.4, "r_x1": 360.4, "r_y1": 208.4, "r_x2": 360.4, "r_y2": 200.3, "r_x3": 339.4, "r_y3": 200.3, "coord_origin": "TOPLEFT" }, "text": "0.955", "orig": "0.955", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 27, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 382.1, "r_y0": 208.4, "r_x1": 403.0, "r_y1": 208.4, "r_x2": 403.0, "r_y2": 200.3, "r_x3": 382.1, "r_y3": 200.3, "coord_origin": "TOPLEFT" }, "text": "0.857", "orig": "0.857", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 28, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 436.7, "r_y0": 208.4, "r_x1": 453.1, "r_y1": 208.4, "r_x2": 453.1, "r_y2": 200.3, "r_x3": 436.7, "r_y3": 200.3, "coord_origin": "TOPLEFT" }, "text": "5.39", "orig": "5.39", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 29, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 155.9, "r_y0": 227.2, "r_x1": 199.8, "r_y1": 227.2, "r_x2": 199.8, "r_y2": 219.2, "r_x3": 155.9, "r_y3": 219.2, "coord_origin": "TOPLEFT" }, "text": "FinTabNet", "orig": "FinTabNet", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 30, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 222.4, "r_y0": 221.8, "r_x1": 247.1, "r_y1": 221.8, "r_x2": 247.1, "r_y2": 213.7, "r_x3": 222.4, "r_y3": 213.7, "coord_origin": "TOPLEFT" }, "text": "OTSL", "orig": "OTSL", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 31, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 264.7, "r_y0": 221.8, "r_x1": 285.7, "r_y1": 221.8, "r_x2": 285.7, "r_y2": 213.7, "r_x3": 264.7, "r_y3": 213.7, "coord_origin": "TOPLEFT" }, "text": "0.955", "orig": "0.955", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 32, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 302.4, "r_y0": 221.8, "r_x1": 323.4, "r_y1": 221.8, "r_x2": 323.4, "r_y2": 213.7, "r_x3": 302.4, "r_y3": 213.7, "coord_origin": "TOPLEFT" }, "text": "0.961", "orig": "0.961", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 33, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 337.8, "r_y0": 221.5, "r_x1": 362.0, "r_y1": 221.5, "r_x2": 362.0, "r_y2": 213.6, "r_x3": 337.8, "r_y3": 213.6, "coord_origin": "TOPLEFT" }, "text": "0.959", "orig": "0.959", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 34, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 380.5, "r_y0": 221.5, "r_x1": 404.6, "r_y1": 221.5, "r_x2": 404.6, "r_y2": 213.6, "r_x3": 380.5, "r_y3": 213.6, "coord_origin": "TOPLEFT" }, "text": "0.862", "orig": "0.862", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 35, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 435.5, "r_y0": 221.5, "r_x1": 454.4, "r_y1": 221.5, "r_x2": 454.4, "r_y2": 213.6, "r_x3": 435.5, "r_y3": 213.6, "coord_origin": "TOPLEFT" }, "text": "1.85", "orig": "1.85", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 36, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 220.9, "r_y0": 234.7, "r_x1": 248.7, "r_y1": 234.7, "r_x2": 248.7, "r_y2": 226.6, "r_x3": 220.9, "r_y3": 226.6, "coord_origin": "TOPLEFT" }, "text": "HTML", "orig": "HTML", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 37, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 264.7, "r_y0": 234.7, "r_x1": 285.7, "r_y1": 234.7, "r_x2": 285.7, "r_y2": 226.6, "r_x3": 264.7, "r_y3": 226.6, "coord_origin": "TOPLEFT" }, "text": "0.917", "orig": "0.917", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 38, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 302.4, "r_y0": 234.7, "r_x1": 323.4, "r_y1": 234.7, "r_x2": 323.4, "r_y2": 226.6, "r_x3": 302.4, "r_y3": 226.6, "coord_origin": "TOPLEFT" }, "text": "0.922", "orig": "0.922", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 39, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 341.7, "r_y0": 234.7, "r_x1": 358.1, "r_y1": 234.7, "r_x2": 358.1, "r_y2": 226.6, "r_x3": 341.7, "r_y3": 226.6, "coord_origin": "TOPLEFT" }, "text": "0.92", "orig": "0.92", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 40, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 382.1, "r_y0": 234.7, "r_x1": 403.0, "r_y1": 234.7, "r_x2": 403.0, "r_y2": 226.6, "r_x3": 382.1, "r_y3": 226.6, "coord_origin": "TOPLEFT" }, "text": "0.722", "orig": "0.722", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 41, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 436.7, "r_y0": 234.7, "r_x1": 453.1, "r_y1": 234.7, "r_x2": 453.1, "r_y2": 226.6, "r_x3": 436.7, "r_y3": 226.6, "coord_origin": "TOPLEFT" }, "text": "3.26", "orig": "3.26", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 42, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 148.6, "r_y0": 253.5, "r_x1": 207.2, "r_y1": 253.5, "r_x2": 207.2, "r_y2": 245.5, "r_x3": 148.6, "r_y3": 245.5, "coord_origin": "TOPLEFT" }, "text": "PubTables-1M", "orig": "PubTables-1M", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 43, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 222.4, "r_y0": 248.1, "r_x1": 247.1, "r_y1": 248.1, "r_x2": 247.1, "r_y2": 240.0, "r_x3": 222.4, "r_y3": 240.0, "coord_origin": "TOPLEFT" }, "text": "OTSL", "orig": "OTSL", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 44, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 264.7, "r_y0": 248.1, "r_x1": 285.7, "r_y1": 248.1, "r_x2": 285.7, "r_y2": 240.0, "r_x3": 264.7, "r_y3": 240.0, "coord_origin": "TOPLEFT" }, "text": "0.987", "orig": "0.987", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 45, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 302.4, "r_y0": 248.1, "r_x1": 323.4, "r_y1": 248.1, "r_x2": 323.4, "r_y2": 240.0, "r_x3": 302.4, "r_y3": 240.0, "coord_origin": "TOPLEFT" }, "text": "0.964", "orig": "0.964", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 46, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 337.8, "r_y0": 247.8, "r_x1": 362.0, "r_y1": 247.8, "r_x2": 362.0, "r_y2": 239.9, "r_x3": 337.8, "r_y3": 239.9, "coord_origin": "TOPLEFT" }, "text": "0.977", "orig": "0.977", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 47, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 380.5, "r_y0": 247.8, "r_x1": 404.6, "r_y1": 247.8, "r_x2": 404.6, "r_y2": 239.9, "r_x3": 380.5, "r_y3": 239.9, "coord_origin": "TOPLEFT" }, "text": "0.896", "orig": "0.896", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 48, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 435.5, "r_y0": 247.8, "r_x1": 454.4, "r_y1": 247.8, "r_x2": 454.4, "r_y2": 239.9, "r_x3": 435.5, "r_y3": 239.9, "coord_origin": "TOPLEFT" }, "text": "1.79", "orig": "1.79", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 49, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 220.9, "r_y0": 261.0, "r_x1": 248.7, "r_y1": 261.0, "r_x2": 248.7, "r_y2": 252.9, "r_x3": 220.9, "r_y3": 252.9, "coord_origin": "TOPLEFT" }, "text": "HTML", "orig": "HTML", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 50, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 264.7, "r_y0": 261.0, "r_x1": 285.7, "r_y1": 261.0, "r_x2": 285.7, "r_y2": 252.9, "r_x3": 264.7, "r_y3": 252.9, "coord_origin": "TOPLEFT" }, "text": "0.983", "orig": "0.983", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 51, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 302.4, "r_y0": 261.0, "r_x1": 323.4, "r_y1": 261.0, "r_x2": 323.4, "r_y2": 252.9, "r_x3": 302.4, "r_y3": 252.9, "coord_origin": "TOPLEFT" }, "text": "0.944", "orig": "0.944", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 52, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 339.4, "r_y0": 261.0, "r_x1": 360.4, "r_y1": 261.0, "r_x2": 360.4, "r_y2": 252.9, "r_x3": 339.4, "r_y3": 252.9, "coord_origin": "TOPLEFT" }, "text": "0.966", "orig": "0.966", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 53, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 382.1, "r_y0": 261.0, "r_x1": 403.0, "r_y1": 261.0, "r_x2": 403.0, "r_y2": 252.9, "r_x3": 382.1, "r_y3": 252.9, "coord_origin": "TOPLEFT" }, "text": "0.889", "orig": "0.889", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 54, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 436.7, "r_y0": 261.0, "r_x1": 453.1, "r_y1": 261.0, "r_x2": 453.1, "r_y2": 252.9, "r_x3": 436.7, "r_y3": 252.9, "coord_origin": "TOPLEFT" }, "text": "3.26", "orig": "3.26", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [ { "id": 10, "label": "text", "bbox": { "l": 160.8, "t": 166.6, "r": 195.0, "b": 174.6, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 7, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 160.8, "r_y0": 174.6, "r_x1": 195.0, "r_y1": 174.6, "r_x2": 195.0, "r_y2": 166.6, "r_x3": 160.8, "r_y3": 166.6, "coord_origin": "TOPLEFT" }, "text": "Data set", "orig": "Data set", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 11, "label": "text", "bbox": { "l": 215.5, "t": 166.5, "r": 254.0, "b": 174.6, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 8, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 215.5, "r_y0": 174.6, "r_x1": 254.0, "r_y1": 174.6, "r_x2": 254.0, "r_y2": 166.5, "r_x3": 215.5, "r_y3": 166.5, "coord_origin": "TOPLEFT" }, "text": "Language", "orig": "Language", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 12, "label": "text", "bbox": { "l": 300.4, "t": 161.1, "r": 324.0, "b": 169.1, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 9, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 300.4, "r_y0": 169.1, "r_x1": 324.0, "r_y1": 169.1, "r_x2": 324.0, "r_y2": 161.1, "r_x3": 300.4, "r_y3": 161.1, "coord_origin": "TOPLEFT" }, "text": "TEDs", "orig": "TEDs", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 13, "label": "text", "bbox": { "l": 370.3, "t": 166.6, "r": 414.7, "b": 174.6, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 10, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 370.3, "r_y0": 174.6, "r_x1": 414.7, "r_y1": 174.6, "r_x2": 414.7, "r_y2": 166.6, "r_x3": 370.3, "r_y3": 166.6, "coord_origin": "TOPLEFT" }, "text": "mAP(0.75)", "orig": "mAP(0.75)", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 14, "label": "text", "bbox": { "l": 426.7, "t": 161.1, "r": 463.1, "b": 169.1, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 11, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 426.7, "r_y0": 169.1, "r_x1": 463.1, "r_y1": 169.1, "r_x2": 463.1, "r_y2": 161.1, "r_x3": 426.7, "r_y3": 161.1, "coord_origin": "TOPLEFT" }, "text": "Inference", "orig": "Inference", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 15, "label": "text", "bbox": { "l": 423.1, "t": 172.0, "r": 466.7, "b": 180.1, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 12, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 423.1, "r_y0": 180.1, "r_x1": 466.7, "r_y1": 180.1, "r_x2": 466.7, "r_y2": 172.0, "r_x3": 423.1, "r_y3": 172.0, "coord_origin": "TOPLEFT" }, "text": "time (secs)", "orig": "time (secs)", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 16, "label": "text", "bbox": { "l": 262.4, "t": 174.0, "r": 288.1, "b": 182.1, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 13, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 262.4, "r_y0": 182.1, "r_x1": 288.1, "r_y1": 182.1, "r_x2": 288.1, "r_y2": 174.0, "r_x3": 262.4, "r_y3": 174.0, "coord_origin": "TOPLEFT" }, "text": "simple", "orig": "simple", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 17, "label": "text", "bbox": { "l": 296.4, "t": 174.0, "r": 329.4, "b": 182.1, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 14, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 296.4, "r_y0": 182.1, "r_x1": 329.4, "r_y1": 182.1, "r_x2": 329.4, "r_y2": 174.0, "r_x3": 296.4, "r_y3": 174.0, "coord_origin": "TOPLEFT" }, "text": "complex", "orig": "complex", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 18, "label": "text", "bbox": { "l": 345.0, "t": 174.0, "r": 354.8, "b": 182.1, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 15, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 345.0, "r_y0": 182.1, "r_x1": 354.8, "r_y1": 182.1, "r_x2": 354.8, "r_y2": 174.0, "r_x3": 345.0, "r_y3": 174.0, "coord_origin": "TOPLEFT" }, "text": "all", "orig": "all", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 19, "label": "text", "bbox": { "l": 154.5, "t": 192.9, "r": 201.2, "b": 200.9, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 16, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 154.5, "r_y0": 200.9, "r_x1": 201.2, "r_y1": 200.9, "r_x2": 201.2, "r_y2": 192.9, "r_x3": 154.5, "r_y3": 192.9, "coord_origin": "TOPLEFT" }, "text": "PubTabNet", "orig": "PubTabNet", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 20, "label": "text", "bbox": { "l": 222.4, "t": 187.4, "r": 247.1, "b": 195.5, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 17, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 222.4, "r_y0": 195.5, "r_x1": 247.1, "r_y1": 195.5, "r_x2": 247.1, "r_y2": 187.4, "r_x3": 222.4, "r_y3": 187.4, "coord_origin": "TOPLEFT" }, "text": "OTSL", "orig": "OTSL", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 21, "label": "text", "bbox": { "l": 264.7, "t": 187.4, "r": 285.7, "b": 195.5, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 18, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 264.7, "r_y0": 195.5, "r_x1": 285.7, "r_y1": 195.5, "r_x2": 285.7, "r_y2": 187.4, "r_x3": 264.7, "r_y3": 187.4, "coord_origin": "TOPLEFT" }, "text": "0.965", "orig": "0.965", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 22, "label": "text", "bbox": { "l": 302.4, "t": 187.4, "r": 323.4, "b": 195.5, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 19, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 302.4, "r_y0": 195.5, "r_x1": 323.4, "r_y1": 195.5, "r_x2": 323.4, "r_y2": 187.4, "r_x3": 302.4, "r_y3": 187.4, "coord_origin": "TOPLEFT" }, "text": "0.934", "orig": "0.934", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 23, "label": "text", "bbox": { "l": 339.4, "t": 187.4, "r": 360.4, "b": 195.5, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 20, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 339.4, "r_y0": 195.5, "r_x1": 360.4, "r_y1": 195.5, "r_x2": 360.4, "r_y2": 187.4, "r_x3": 339.4, "r_y3": 187.4, "coord_origin": "TOPLEFT" }, "text": "0.955", "orig": "0.955", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 24, "label": "text", "bbox": { "l": 383.1, "t": 187.3, "r": 402.0, "b": 195.2, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 21, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 383.1, "r_y0": 195.2, "r_x1": 402.0, "r_y1": 195.2, "r_x2": 402.0, "r_y2": 187.3, "r_x3": 383.1, "r_y3": 187.3, "coord_origin": "TOPLEFT" }, "text": "0.88", "orig": "0.88", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 25, "label": "text", "bbox": { "l": 435.5, "t": 187.3, "r": 454.4, "b": 195.2, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 22, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 435.5, "r_y0": 195.2, "r_x1": 454.4, "r_y1": 195.2, "r_x2": 454.4, "r_y2": 187.3, "r_x3": 435.5, "r_y3": 187.3, "coord_origin": "TOPLEFT" }, "text": "2.73", "orig": "2.73", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 26, "label": "text", "bbox": { "l": 220.9, "t": 200.3, "r": 248.7, "b": 208.4, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 23, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 220.9, "r_y0": 208.4, "r_x1": 248.7, "r_y1": 208.4, "r_x2": 248.7, "r_y2": 200.3, "r_x3": 220.9, "r_y3": 200.3, "coord_origin": "TOPLEFT" }, "text": "HTML", "orig": "HTML", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 27, "label": "text", "bbox": { "l": 264.7, "t": 200.3, "r": 285.7, "b": 208.4, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 24, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 264.7, "r_y0": 208.4, "r_x1": 285.7, "r_y1": 208.4, "r_x2": 285.7, "r_y2": 200.3, "r_x3": 264.7, "r_y3": 200.3, "coord_origin": "TOPLEFT" }, "text": "0.969", "orig": "0.969", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 28, "label": "text", "bbox": { "l": 302.4, "t": 200.3, "r": 323.4, "b": 208.4, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 25, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 302.4, "r_y0": 208.4, "r_x1": 323.4, "r_y1": 208.4, "r_x2": 323.4, "r_y2": 200.3, "r_x3": 302.4, "r_y3": 200.3, "coord_origin": "TOPLEFT" }, "text": "0.927", "orig": "0.927", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 29, "label": "text", "bbox": { "l": 339.4, "t": 200.3, "r": 360.4, "b": 208.4, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 26, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 339.4, "r_y0": 208.4, "r_x1": 360.4, "r_y1": 208.4, "r_x2": 360.4, "r_y2": 200.3, "r_x3": 339.4, "r_y3": 200.3, "coord_origin": "TOPLEFT" }, "text": "0.955", "orig": "0.955", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 30, "label": "text", "bbox": { "l": 382.1, "t": 200.3, "r": 403.0, "b": 208.4, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 27, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 382.1, "r_y0": 208.4, "r_x1": 403.0, "r_y1": 208.4, "r_x2": 403.0, "r_y2": 200.3, "r_x3": 382.1, "r_y3": 200.3, "coord_origin": "TOPLEFT" }, "text": "0.857", "orig": "0.857", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 31, "label": "text", "bbox": { "l": 436.7, "t": 200.3, "r": 453.1, "b": 208.4, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 28, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 436.7, "r_y0": 208.4, "r_x1": 453.1, "r_y1": 208.4, "r_x2": 453.1, "r_y2": 200.3, "r_x3": 436.7, "r_y3": 200.3, "coord_origin": "TOPLEFT" }, "text": "5.39", "orig": "5.39", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 32, "label": "text", "bbox": { "l": 155.9, "t": 219.2, "r": 199.8, "b": 227.2, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 29, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 155.9, "r_y0": 227.2, "r_x1": 199.8, "r_y1": 227.2, "r_x2": 199.8, "r_y2": 219.2, "r_x3": 155.9, "r_y3": 219.2, "coord_origin": "TOPLEFT" }, "text": "FinTabNet", "orig": "FinTabNet", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 33, "label": "text", "bbox": { "l": 222.4, "t": 213.7, "r": 247.1, "b": 221.8, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 30, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 222.4, "r_y0": 221.8, "r_x1": 247.1, "r_y1": 221.8, "r_x2": 247.1, "r_y2": 213.7, "r_x3": 222.4, "r_y3": 213.7, "coord_origin": "TOPLEFT" }, "text": "OTSL", "orig": "OTSL", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 34, "label": "text", "bbox": { "l": 264.7, "t": 213.7, "r": 285.7, "b": 221.8, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 31, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 264.7, "r_y0": 221.8, "r_x1": 285.7, "r_y1": 221.8, "r_x2": 285.7, "r_y2": 213.7, "r_x3": 264.7, "r_y3": 213.7, "coord_origin": "TOPLEFT" }, "text": "0.955", "orig": "0.955", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 35, "label": "text", "bbox": { "l": 302.4, "t": 213.7, "r": 323.4, "b": 221.8, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 32, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 302.4, "r_y0": 221.8, "r_x1": 323.4, "r_y1": 221.8, "r_x2": 323.4, "r_y2": 213.7, "r_x3": 302.4, "r_y3": 213.7, "coord_origin": "TOPLEFT" }, "text": "0.961", "orig": "0.961", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 36, "label": "text", "bbox": { "l": 337.8, "t": 213.6, "r": 362.0, "b": 221.5, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 33, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 337.8, "r_y0": 221.5, "r_x1": 362.0, "r_y1": 221.5, "r_x2": 362.0, "r_y2": 213.6, "r_x3": 337.8, "r_y3": 213.6, "coord_origin": "TOPLEFT" }, "text": "0.959", "orig": "0.959", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 37, "label": "text", "bbox": { "l": 380.5, "t": 213.6, "r": 404.6, "b": 221.5, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 34, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 380.5, "r_y0": 221.5, "r_x1": 404.6, "r_y1": 221.5, "r_x2": 404.6, "r_y2": 213.6, "r_x3": 380.5, "r_y3": 213.6, "coord_origin": "TOPLEFT" }, "text": "0.862", "orig": "0.862", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 38, "label": "text", "bbox": { "l": 435.5, "t": 213.6, "r": 454.4, "b": 221.5, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 35, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 435.5, "r_y0": 221.5, "r_x1": 454.4, "r_y1": 221.5, "r_x2": 454.4, "r_y2": 213.6, "r_x3": 435.5, "r_y3": 213.6, "coord_origin": "TOPLEFT" }, "text": "1.85", "orig": "1.85", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 39, "label": "text", "bbox": { "l": 220.9, "t": 226.6, "r": 248.7, "b": 234.7, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 36, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 220.9, "r_y0": 234.7, "r_x1": 248.7, "r_y1": 234.7, "r_x2": 248.7, "r_y2": 226.6, "r_x3": 220.9, "r_y3": 226.6, "coord_origin": "TOPLEFT" }, "text": "HTML", "orig": "HTML", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 40, "label": "text", "bbox": { "l": 264.7, "t": 226.6, "r": 285.7, "b": 234.7, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 37, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 264.7, "r_y0": 234.7, "r_x1": 285.7, "r_y1": 234.7, "r_x2": 285.7, "r_y2": 226.6, "r_x3": 264.7, "r_y3": 226.6, "coord_origin": "TOPLEFT" }, "text": "0.917", "orig": "0.917", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 41, "label": "text", "bbox": { "l": 302.4, "t": 226.6, "r": 323.4, "b": 234.7, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 38, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 302.4, "r_y0": 234.7, "r_x1": 323.4, "r_y1": 234.7, "r_x2": 323.4, "r_y2": 226.6, "r_x3": 302.4, "r_y3": 226.6, "coord_origin": "TOPLEFT" }, "text": "0.922", "orig": "0.922", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 42, "label": "text", "bbox": { "l": 341.7, "t": 226.6, "r": 358.1, "b": 234.7, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 39, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 341.7, "r_y0": 234.7, "r_x1": 358.1, "r_y1": 234.7, "r_x2": 358.1, "r_y2": 226.6, "r_x3": 341.7, "r_y3": 226.6, "coord_origin": "TOPLEFT" }, "text": "0.92", "orig": "0.92", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 43, "label": "text", "bbox": { "l": 382.1, "t": 226.6, "r": 403.0, "b": 234.7, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 40, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 382.1, "r_y0": 234.7, "r_x1": 403.0, "r_y1": 234.7, "r_x2": 403.0, "r_y2": 226.6, "r_x3": 382.1, "r_y3": 226.6, "coord_origin": "TOPLEFT" }, "text": "0.722", "orig": "0.722", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 44, "label": "text", "bbox": { "l": 436.7, "t": 226.6, "r": 453.1, "b": 234.7, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 41, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 436.7, "r_y0": 234.7, "r_x1": 453.1, "r_y1": 234.7, "r_x2": 453.1, "r_y2": 226.6, "r_x3": 436.7, "r_y3": 226.6, "coord_origin": "TOPLEFT" }, "text": "3.26", "orig": "3.26", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 45, "label": "text", "bbox": { "l": 148.6, "t": 245.5, "r": 207.2, "b": 253.5, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 42, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 148.6, "r_y0": 253.5, "r_x1": 207.2, "r_y1": 253.5, "r_x2": 207.2, "r_y2": 245.5, "r_x3": 148.6, "r_y3": 245.5, "coord_origin": "TOPLEFT" }, "text": "PubTables-1M", "orig": "PubTables-1M", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 46, "label": "text", "bbox": { "l": 222.4, "t": 240.0, "r": 247.1, "b": 248.1, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 43, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 222.4, "r_y0": 248.1, "r_x1": 247.1, "r_y1": 248.1, "r_x2": 247.1, "r_y2": 240.0, "r_x3": 222.4, "r_y3": 240.0, "coord_origin": "TOPLEFT" }, "text": "OTSL", "orig": "OTSL", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 47, "label": "text", "bbox": { "l": 264.7, "t": 240.0, "r": 285.7, "b": 248.1, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 44, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 264.7, "r_y0": 248.1, "r_x1": 285.7, "r_y1": 248.1, "r_x2": 285.7, "r_y2": 240.0, "r_x3": 264.7, "r_y3": 240.0, "coord_origin": "TOPLEFT" }, "text": "0.987", "orig": "0.987", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 48, "label": "text", "bbox": { "l": 302.4, "t": 240.0, "r": 323.4, "b": 248.1, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 45, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 302.4, "r_y0": 248.1, "r_x1": 323.4, "r_y1": 248.1, "r_x2": 323.4, "r_y2": 240.0, "r_x3": 302.4, "r_y3": 240.0, "coord_origin": "TOPLEFT" }, "text": "0.964", "orig": "0.964", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 49, "label": "text", "bbox": { "l": 337.8, "t": 239.9, "r": 362.0, "b": 247.8, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 46, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 337.8, "r_y0": 247.8, "r_x1": 362.0, "r_y1": 247.8, "r_x2": 362.0, "r_y2": 239.9, "r_x3": 337.8, "r_y3": 239.9, "coord_origin": "TOPLEFT" }, "text": "0.977", "orig": "0.977", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 50, "label": "text", "bbox": { "l": 380.5, "t": 239.9, "r": 404.6, "b": 247.8, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 47, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 380.5, "r_y0": 247.8, "r_x1": 404.6, "r_y1": 247.8, "r_x2": 404.6, "r_y2": 239.9, "r_x3": 380.5, "r_y3": 239.9, "coord_origin": "TOPLEFT" }, "text": "0.896", "orig": "0.896", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 51, "label": "text", "bbox": { "l": 435.5, "t": 239.9, "r": 454.4, "b": 247.8, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 48, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 435.5, "r_y0": 247.8, "r_x1": 454.4, "r_y1": 247.8, "r_x2": 454.4, "r_y2": 239.9, "r_x3": 435.5, "r_y3": 239.9, "coord_origin": "TOPLEFT" }, "text": "1.79", "orig": "1.79", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 52, "label": "text", "bbox": { "l": 220.9, "t": 252.9, "r": 248.7, "b": 261.0, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 49, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 220.9, "r_y0": 261.0, "r_x1": 248.7, "r_y1": 261.0, "r_x2": 248.7, "r_y2": 252.9, "r_x3": 220.9, "r_y3": 252.9, "coord_origin": "TOPLEFT" }, "text": "HTML", "orig": "HTML", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 53, "label": "text", "bbox": { "l": 264.7, "t": 252.9, "r": 285.7, "b": 261.0, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 50, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 264.7, "r_y0": 261.0, "r_x1": 285.7, "r_y1": 261.0, "r_x2": 285.7, "r_y2": 252.9, "r_x3": 264.7, "r_y3": 252.9, "coord_origin": "TOPLEFT" }, "text": "0.983", "orig": "0.983", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 54, "label": "text", "bbox": { "l": 302.4, "t": 252.9, "r": 323.4, "b": 261.0, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 51, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 302.4, "r_y0": 261.0, "r_x1": 323.4, "r_y1": 261.0, "r_x2": 323.4, "r_y2": 252.9, "r_x3": 302.4, "r_y3": 252.9, "coord_origin": "TOPLEFT" }, "text": "0.944", "orig": "0.944", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 55, "label": "text", "bbox": { "l": 339.4, "t": 252.9, "r": 360.4, "b": 261.0, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 52, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 339.4, "r_y0": 261.0, "r_x1": 360.4, "r_y1": 261.0, "r_x2": 360.4, "r_y2": 252.9, "r_x3": 339.4, "r_y3": 252.9, "coord_origin": "TOPLEFT" }, "text": "0.966", "orig": "0.966", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 56, "label": "text", "bbox": { "l": 382.1, "t": 252.9, "r": 403.0, "b": 261.0, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 53, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 382.1, "r_y0": 261.0, "r_x1": 403.0, "r_y1": 261.0, "r_x2": 403.0, "r_y2": 252.9, "r_x3": 382.1, "r_y3": 252.9, "coord_origin": "TOPLEFT" }, "text": "0.889", "orig": "0.889", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 57, "label": "text", "bbox": { "l": 436.7, "t": 252.9, "r": 453.1, "b": 261.0, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 54, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 436.7, "r_y0": 261.0, "r_x1": 453.1, "r_y1": 261.0, "r_x2": 453.1, "r_y2": 252.9, "r_x3": 436.7, "r_y3": 252.9, "coord_origin": "TOPLEFT" }, "text": "3.26", "orig": "3.26", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] } ] }, { "id": 3, "label": "section_header", "bbox": { "l": 134.8, "t": 288.9, "r": 257.1, "b": 297.7, "coord_origin": "TOPLEFT" }, "confidence": 0.95, "cells": [ { "index": 55, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 134.8, "r_y0": 297.7, "r_x1": 149.4, "r_y1": 297.7, "r_x2": 149.4, "r_y2": 288.9, "r_x3": 134.8, "r_y3": 288.9, "coord_origin": "TOPLEFT" }, "text": "5.3", "orig": "5.3", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 56, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 160.9, "r_y0": 297.7, "r_x1": 257.1, "r_y1": 297.7, "r_x2": 257.1, "r_y2": 288.9, "r_x3": 160.9, "r_y3": 288.9, "coord_origin": "TOPLEFT" }, "text": "Qualitative Results", "orig": "Qualitative Results", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 1, "label": "text", "bbox": { "l": 134.8, "t": 309.9, "r": 480.6, "b": 366.5, "coord_origin": "TOPLEFT" }, "confidence": 0.98, "cells": [ { "index": 57, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 134.8, "r_y0": 318.7, "r_x1": 480.6, "r_y1": 318.7, "r_x2": 480.6, "r_y2": 309.9, "r_x3": 134.8, "r_y3": 309.9, "coord_origin": "TOPLEFT" }, "text": "To illustrate the qualitative differences between OTSL and HTML, Figure 5", "orig": "To illustrate the qualitative differences between OTSL and HTML, Figure 5", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 58, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 134.8, "r_y0": 330.6, "r_x1": 480.6, "r_y1": 330.6, "r_x2": 480.6, "r_y2": 321.8, "r_x3": 134.8, "r_y3": 321.8, "coord_origin": "TOPLEFT" }, "text": "demonstrates less overlap and more accurate bounding boxes with OTSL. In", "orig": "demonstrates less overlap and more accurate bounding boxes with OTSL. In", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 59, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 134.8, "r_y0": 342.6, "r_x1": 480.6, "r_y1": 342.6, "r_x2": 480.6, "r_y2": 333.8, "r_x3": 134.8, "r_y3": 333.8, "coord_origin": "TOPLEFT" }, "text": "Figure 6, OTSL proves to be more effective in handling tables with longer to-", "orig": "Figure 6, OTSL proves to be more effective in handling tables with longer to-", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 60, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 134.8, "r_y0": 354.5, "r_x1": 480.6, "r_y1": 354.5, "r_x2": 480.6, "r_y2": 345.7, "r_x3": 134.8, "r_y3": 345.7, "coord_origin": "TOPLEFT" }, "text": "ken sequences, resulting in even more precise structure prediction and bounding", "orig": "ken sequences, resulting in even more precise structure prediction and bounding", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 61, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 134.8, "r_y0": 366.5, "r_x1": 161.7, "r_y1": 366.5, "r_x2": 161.7, "r_y2": 357.7, "r_x3": 134.8, "r_y3": 357.7, "coord_origin": "TOPLEFT" }, "text": "boxes.", "orig": "boxes.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 5, "label": "caption", "bbox": { "l": 134.8, "t": 397.6, "r": 480.6, "b": 439.7, "coord_origin": "TOPLEFT" }, "confidence": 0.95, "cells": [ { "index": 62, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 134.8, "r_y0": 405.5, "r_x1": 162.6, "r_y1": 405.5, "r_x2": 162.6, "r_y2": 397.6, "r_x3": 134.8, "r_y3": 397.6, "coord_origin": "TOPLEFT" }, "text": "Fig. 5.", "orig": "Fig. 5.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 63, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 167.4, "r_y0": 405.7, "r_x1": 480.6, "r_y1": 405.7, "r_x2": 480.6, "r_y2": 397.7, "r_x3": 167.4, "r_y3": 397.7, "coord_origin": "TOPLEFT" }, "text": "The OTSL model produces more accurate bounding boxes with less over-", "orig": "The OTSL model produces more accurate bounding boxes with less over-", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 64, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 134.8, "r_y0": 416.7, "r_x1": 480.6, "r_y1": 416.7, "r_x2": 480.6, "r_y2": 408.6, "r_x3": 134.8, "r_y3": 408.6, "coord_origin": "TOPLEFT" }, "text": "lap (E) than the HTML model (D), when predicting the structure of a sparse ta-", "orig": "lap (E) than the HTML model (D), when predicting the structure of a sparse ta-", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 65, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 134.8, "r_y0": 427.6, "r_x1": 480.6, "r_y1": 427.6, "r_x2": 480.6, "r_y2": 419.6, "r_x3": 134.8, "r_y3": 419.6, "coord_origin": "TOPLEFT" }, "text": "ble (A), at twice the inference speed because of shorter sequence length (B),(C).", "orig": "ble (A), at twice the inference speed because of shorter sequence length (B),(C).", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 66, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 134.8, "r_y0": 438.6, "r_x1": 304.7, "r_y1": 438.6, "r_x2": 304.7, "r_y2": 430.5, "r_x3": 134.8, "r_y3": 430.5, "coord_origin": "TOPLEFT" }, "text": "\"PMC2807444_006_00.png\" PubTabNet.", "orig": "\"PMC2807444_006_00.png\" PubTabNet.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 118, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 342.6, "r_y0": 439.7, "r_x1": 344.8, "r_y1": 439.7, "r_x2": 344.8, "r_y2": 430.2, "r_x3": 342.6, "r_y3": 430.2, "coord_origin": "TOPLEFT" }, "text": "\u03bc", "orig": "\u03bc", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 2, "label": "picture", "bbox": { "l": 162.7, "t": 444.6, "r": 451.7, "b": 663.2, "coord_origin": "TOPLEFT" }, "confidence": 0.97, "cells": [ { "index": 67, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 180.1, "r_y0": 518.9, "r_x1": 190.6, "r_y1": 518.9, "r_x2": 190.6, "r_y2": 516.2, "r_x3": 180.1, "r_y3": 516.2, "coord_origin": "TOPLEFT" }, "text": "", "orig": "
", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 68, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 183.2, "r_y0": 522.8, "r_x1": 304.5, "r_y1": 522.8, "r_x2": 304.5, "r_y2": 520.1, "r_x3": 183.2, "r_y3": 520.1, "coord_origin": "TOPLEFT" }, "text": "", "orig": "", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 69, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 183.2, "r_y0": 526.7, "r_x1": 388.4, "r_y1": 526.7, "r_x2": 388.4, "r_y2": 524.0, "r_x3": 183.2, "r_y3": 524.0, "coord_origin": "TOPLEFT" }, "text": "", "orig": "", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 70, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 183.2, "r_y0": 530.6, "r_x1": 388.4, "r_y1": 530.6, "r_x2": 388.4, "r_y2": 527.9, "r_x3": 183.2, "r_y3": 527.9, "coord_origin": "TOPLEFT" }, "text": "", "orig": "", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 71, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 183.2, "r_y0": 534.5, "r_x1": 388.4, "r_y1": 534.5, "r_x2": 388.4, "r_y2": 531.8, "r_x3": 183.2, "r_y3": 531.8, "coord_origin": "TOPLEFT" }, "text": "", "orig": "", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 72, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 183.2, "r_y0": 538.4, "r_x1": 388.4, "r_y1": 538.4, "r_x2": 388.4, "r_y2": 535.7, "r_x3": 183.2, "r_y3": 535.7, "coord_origin": "TOPLEFT" }, "text": "", "orig": "", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 73, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 183.2, "r_y0": 542.3, "r_x1": 388.4, "r_y1": 542.3, "r_x2": 388.4, "r_y2": 539.6, "r_x3": 183.2, "r_y3": 539.6, "coord_origin": "TOPLEFT" }, "text": "", "orig": "", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 74, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 183.2, "r_y0": 546.2, "r_x1": 388.4, "r_y1": 546.2, "r_x2": 388.4, "r_y2": 543.5, "r_x3": 183.2, "r_y3": 543.5, "coord_origin": "TOPLEFT" }, "text": "", "orig": "", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 75, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 183.2, "r_y0": 550.1, "r_x1": 388.4, "r_y1": 550.1, "r_x2": 388.4, "r_y2": 547.4, "r_x3": 183.2, "r_y3": 547.4, "coord_origin": "TOPLEFT" }, "text": "", "orig": "", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 76, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 183.2, "r_y0": 554.0, "r_x1": 388.4, "r_y1": 554.0, "r_x2": 388.4, "r_y2": 551.3, "r_x3": 183.2, "r_y3": 551.3, "coord_origin": "TOPLEFT" }, "text": "", "orig": "", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 77, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 180.1, "r_y0": 557.9, "r_x1": 191.9, "r_y1": 557.9, "r_x2": 191.9, "r_y2": 555.2, "r_x3": 180.1, "r_y3": 555.2, "coord_origin": "TOPLEFT" }, "text": "
", "orig": "", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 78, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 407.4, "r_y0": 521.0, "r_x1": 408.8, "r_y1": 521.0, "r_x2": 408.8, "r_y2": 518.3, "r_x3": 407.4, "r_y3": 518.3, "coord_origin": "TOPLEFT" }, "text": "C", "orig": "C", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 79, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 410.3, "r_y0": 521.0, "r_x1": 450.5, "r_y1": 521.0, "r_x2": 450.5, "r_y2": 518.3, "r_x3": 410.3, "r_y3": 518.3, "coord_origin": "TOPLEFT" }, "text": "C L L L C L L L L L C L L NL", "orig": "C L L L C L L L L L C L L NL", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 80, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 407.4, "r_y0": 524.9, "r_x1": 408.8, "r_y1": 524.9, "r_x2": 408.8, "r_y2": 522.2, "r_x3": 407.4, "r_y3": 522.2, "coord_origin": "TOPLEFT" }, "text": "C", "orig": "C", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 81, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 410.3, "r_y0": 524.9, "r_x1": 450.5, "r_y1": 524.9, "r_x2": 450.5, "r_y2": 522.2, "r_x3": 410.3, "r_y3": 522.2, "coord_origin": "TOPLEFT" }, "text": "C C C C C C C C C C C C C NL", "orig": "C C C C C C C C C C C C C NL", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 82, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 407.4, "r_y0": 528.8, "r_x1": 408.8, "r_y1": 528.8, "r_x2": 408.8, "r_y2": 526.1, "r_x3": 407.4, "r_y3": 526.1, "coord_origin": "TOPLEFT" }, "text": "C", "orig": "C", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 83, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 410.3, "r_y0": 528.8, "r_x1": 450.5, "r_y1": 528.8, "r_x2": 450.5, "r_y2": 526.1, "r_x3": 410.3, "r_y3": 526.1, "coord_origin": "TOPLEFT" }, "text": "C C C C C C C C C C C C C NL", "orig": "C C C C C C C C C C C C C NL", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 84, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 407.4, "r_y0": 532.7, "r_x1": 408.8, "r_y1": 532.7, "r_x2": 408.8, "r_y2": 530.0, "r_x3": 407.4, "r_y3": 530.0, "coord_origin": "TOPLEFT" }, "text": "C", "orig": "C", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 85, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 410.3, "r_y0": 532.7, "r_x1": 450.5, "r_y1": 532.7, "r_x2": 450.5, "r_y2": 530.0, "r_x3": 410.3, "r_y3": 530.0, "coord_origin": "TOPLEFT" }, "text": "C C C C C C C C C C C C C NL", "orig": "C C C C C C C C C C C C C NL", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 86, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 407.4, "r_y0": 536.6, "r_x1": 408.8, "r_y1": 536.6, "r_x2": 408.8, "r_y2": 533.9, "r_x3": 407.4, "r_y3": 533.9, "coord_origin": "TOPLEFT" }, "text": "C", "orig": "C", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 87, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 410.3, "r_y0": 536.6, "r_x1": 450.5, "r_y1": 536.6, "r_x2": 450.5, "r_y2": 533.9, "r_x3": 410.3, "r_y3": 533.9, "coord_origin": "TOPLEFT" }, "text": "C C C C C C C C C C C C C NL", "orig": "C C C C C C C C C C C C C NL", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 88, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 407.4, "r_y0": 540.5, "r_x1": 408.8, "r_y1": 540.5, "r_x2": 408.8, "r_y2": 537.8, "r_x3": 407.4, "r_y3": 537.8, "coord_origin": "TOPLEFT" }, "text": "C", "orig": "C", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 89, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 410.3, "r_y0": 540.5, "r_x1": 450.5, "r_y1": 540.5, "r_x2": 450.5, "r_y2": 537.8, "r_x3": 410.3, "r_y3": 537.8, "coord_origin": "TOPLEFT" }, "text": "C C C C C C C C C C C C C NL", "orig": "C C C C C C C C C C C C C NL", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 90, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 407.4, "r_y0": 544.4, "r_x1": 408.8, "r_y1": 544.4, "r_x2": 408.8, "r_y2": 541.7, "r_x3": 407.4, "r_y3": 541.7, "coord_origin": "TOPLEFT" }, "text": "C", "orig": "C", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 91, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 410.3, "r_y0": 544.4, "r_x1": 450.5, "r_y1": 544.4, "r_x2": 450.5, "r_y2": 541.7, "r_x3": 410.3, "r_y3": 541.7, "coord_origin": "TOPLEFT" }, "text": "C C C C C C C C C C C C C NL", "orig": "C C C C C C C C C C C C C NL", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 92, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 407.4, "r_y0": 548.3, "r_x1": 408.8, "r_y1": 548.3, "r_x2": 408.8, "r_y2": 545.6, "r_x3": 407.4, "r_y3": 545.6, "coord_origin": "TOPLEFT" }, "text": "C", "orig": "C", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 93, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 410.3, "r_y0": 548.3, "r_x1": 450.5, "r_y1": 548.3, "r_x2": 450.5, "r_y2": 545.6, "r_x3": 410.3, "r_y3": 545.6, "coord_origin": "TOPLEFT" }, "text": "C C C C C C C C C C C C C NL", "orig": "C C C C C C C C C C C C C NL", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 94, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 407.4, "r_y0": 552.2, "r_x1": 408.8, "r_y1": 552.2, "r_x2": 408.8, "r_y2": 549.5, "r_x3": 407.4, "r_y3": 549.5, "coord_origin": "TOPLEFT" }, "text": "C", "orig": "C", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 95, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 410.3, "r_y0": 552.2, "r_x1": 450.5, "r_y1": 552.2, "r_x2": 450.5, "r_y2": 549.5, "r_x3": 410.3, "r_y3": 549.5, "coord_origin": "TOPLEFT" }, "text": "C C C C C C C C C C C C C NL", "orig": "C C C C C C C C C C C C C NL", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 96, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 164.5, "r_y0": 515.3, "r_x1": 181.9, "r_y1": 515.3, "r_x2": 181.9, "r_y2": 509.5, "r_x3": 164.5, "r_y3": 509.5, "coord_origin": "TOPLEFT" }, "text": "HTML", "orig": "HTML", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 97, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 183.6, "r_y0": 515.3, "r_x1": 186.4, "r_y1": 515.3, "r_x2": 186.4, "r_y2": 509.5, "r_x3": 183.6, "r_y3": 509.5, "coord_origin": "TOPLEFT" }, "text": "#", "orig": "#", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 98, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 189.2, "r_y0": 515.3, "r_x1": 208.9, "r_y1": 515.3, "r_x2": 208.9, "r_y2": 509.5, "r_x3": 189.2, "r_y3": 509.5, "coord_origin": "TOPLEFT" }, "text": "tokens:", "orig": "tokens:", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 99, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 210.6, "r_y0": 515.3, "r_x1": 221.0, "r_y1": 515.3, "r_x2": 221.0, "r_y2": 509.5, "r_x3": 210.6, "r_y3": 509.5, "coord_origin": "TOPLEFT" }, "text": "258", "orig": "258", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 100, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 390.2, "r_y0": 515.5, "r_x1": 406.8, "r_y1": 515.5, "r_x2": 406.8, "r_y2": 509.6, "r_x3": 390.2, "r_y3": 509.6, "coord_origin": "TOPLEFT" }, "text": "OTSL", "orig": "OTSL", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 101, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 408.6, "r_y0": 515.5, "r_x1": 411.4, "r_y1": 515.5, "r_x2": 411.4, "r_y2": 509.6, "r_x3": 408.6, "r_y3": 509.6, "coord_origin": "TOPLEFT" }, "text": "#", "orig": "#", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 102, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 414.2, "r_y0": 515.5, "r_x1": 433.9, "r_y1": 515.5, "r_x2": 433.9, "r_y2": 509.6, "r_x3": 414.2, "r_y3": 509.6, "coord_origin": "TOPLEFT" }, "text": "tokens:", "orig": "tokens:", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 103, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 435.6, "r_y0": 515.5, "r_x1": 446.0, "r_y1": 515.5, "r_x2": 446.0, "r_y2": 509.6, "r_x3": 435.6, "r_y3": 509.6, "coord_origin": "TOPLEFT" }, "text": "135", "orig": "135", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 104, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 167.2, "r_y0": 526.4, "r_x1": 172.8, "r_y1": 526.4, "r_x2": 172.8, "r_y2": 519.1, "r_x3": 167.2, "r_y3": 519.1, "coord_origin": "TOPLEFT" }, "text": "B", "orig": "B", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 105, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 187.3, "r_y0": 455.9, "r_x1": 193.0, "r_y1": 455.9, "r_x2": 193.0, "r_y2": 448.6, "r_x3": 187.3, "r_y3": 448.6, "coord_origin": "TOPLEFT" }, "text": "A", "orig": "A", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 106, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 167.4, "r_y0": 573.3, "r_x1": 173.0, "r_y1": 573.3, "r_x2": 173.0, "r_y2": 566.0, "r_x3": 167.4, "r_y3": 566.0, "coord_origin": "TOPLEFT" }, "text": "D", "orig": "D", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 107, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 248.5, "r_y0": 629.1, "r_x1": 253.7, "r_y1": 629.1, "r_x2": 253.7, "r_y2": 621.8, "r_x3": 248.5, "r_y3": 621.8, "coord_origin": "TOPLEFT" }, "text": "E", "orig": "E", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 108, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 395.9, "r_y0": 526.5, "r_x1": 401.5, "r_y1": 526.5, "r_x2": 401.5, "r_y2": 519.2, "r_x3": 395.9, "r_y3": 519.2, "coord_origin": "TOPLEFT" }, "text": "C", "orig": "C", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 109, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 171.6, "r_y0": 597.3, "r_x1": 177.5, "r_y1": 597.3, "r_x2": 177.5, "r_y2": 580.3, "r_x3": 171.6, "r_y3": 580.3, "coord_origin": "TOPLEFT" }, "text": "HTML", "orig": "HTML", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 110, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 251.1, "r_y0": 649.9, "r_x1": 256.9, "r_y1": 649.9, "r_x2": 256.9, "r_y2": 633.6, "r_x3": 251.1, "r_y3": 633.6, "coord_origin": "TOPLEFT" }, "text": "OTSL", "orig": "OTSL", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 111, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 372.1, "r_y0": 607.3, "r_x1": 427.0, "r_y1": 607.3, "r_x2": 427.0, "r_y2": 601.5, "r_x3": 372.1, "r_y3": 601.5, "coord_origin": "TOPLEFT" }, "text": "HTML model shows", "orig": "HTML model shows", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 112, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 372.1, "r_y0": 613.8, "r_x1": 430.1, "r_y1": 613.8, "r_x2": 430.1, "r_y2": 607.9, "r_x3": 372.1, "r_y3": 607.9, "coord_origin": "TOPLEFT" }, "text": "bounding box drifting", "orig": "bounding box drifting", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 113, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 176.9, "r_y0": 648.7, "r_x1": 231.1, "r_y1": 648.7, "r_x2": 231.1, "r_y2": 642.9, "r_x3": 176.9, "r_y3": 642.9, "coord_origin": "TOPLEFT" }, "text": "OTSL model shows", "orig": "OTSL model shows", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 114, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 176.9, "r_y0": 655.2, "r_x1": 231.0, "r_y1": 655.2, "r_x2": 231.0, "r_y2": 649.3, "r_x3": 176.9, "r_y3": 649.3, "coord_origin": "TOPLEFT" }, "text": "clean bounding box", "orig": "clean bounding box", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 115, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 176.9, "r_y0": 661.6, "r_x1": 203.9, "r_y1": 661.6, "r_x2": 203.9, "r_y2": 655.8, "r_x3": 176.9, "r_y3": 655.8, "coord_origin": "TOPLEFT" }, "text": "alignment", "orig": "alignment", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 116, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 215.9, "r_y0": 569.2, "r_x1": 218.5, "r_y1": 569.2, "r_x2": 218.5, "r_y2": 557.6, "r_x3": 215.9, "r_y3": 557.6, "coord_origin": "TOPLEFT" }, "text": "\u2264", "orig": "\u2264", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 117, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 229.1, "r_y0": 569.2, "r_x1": 231.7, "r_y1": 569.2, "r_x2": 231.7, "r_y2": 557.6, "r_x3": 229.1, "r_y3": 557.6, "coord_origin": "TOPLEFT" }, "text": "\u03bc", "orig": "\u03bc", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 119, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 261.2, "r_y0": 451.2, "r_x1": 263.6, "r_y1": 451.2, "r_x2": 263.6, "r_y2": 448.5, "r_x3": 261.2, "r_y3": 448.5, "coord_origin": "TOPLEFT" }, "text": "S", "orig": "S", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 120, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 312.3, "r_y0": 451.2, "r_x1": 313.6, "r_y1": 451.2, "r_x2": 313.6, "r_y2": 448.5, "r_x3": 312.3, "r_y3": 448.5, "coord_origin": "TOPLEFT" }, "text": "I", "orig": "I", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 121, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 377.4, "r_y0": 451.2, "r_x1": 380.1, "r_y1": 451.2, "r_x2": 380.1, "r_y2": 448.5, "r_x3": 377.4, "r_y3": 448.5, "coord_origin": "TOPLEFT" }, "text": "R", "orig": "R", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 122, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 200.6, "r_y0": 456.1, "r_x1": 205.8, "r_y1": 456.1, "r_x2": 205.8, "r_y2": 453.3, "r_x3": 200.6, "r_y3": 453.3, "coord_origin": "TOPLEFT" }, "text": "ST", "orig": "ST", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 123, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 222.2, "r_y0": 456.1, "r_x1": 229.8, "r_y1": 456.1, "r_x2": 229.8, "r_y2": 453.3, "r_x3": 222.2, "r_y3": 453.3, "coord_origin": "TOPLEFT" }, "text": "0.03", "orig": "0.03", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 124, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 243.3, "r_y0": 456.1, "r_x1": 250.8, "r_y1": 456.1, "r_x2": 250.8, "r_y2": 453.3, "r_x3": 243.3, "r_y3": 453.3, "coord_origin": "TOPLEFT" }, "text": "0.06", "orig": "0.06", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 125, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 264.3, "r_y0": 456.1, "r_x1": 271.8, "r_y1": 456.1, "r_x2": 271.8, "r_y2": 453.3, "r_x3": 264.3, "r_y3": 453.3, "coord_origin": "TOPLEFT" }, "text": "0.12", "orig": "0.12", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 126, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 285.3, "r_y0": 456.1, "r_x1": 292.9, "r_y1": 456.1, "r_x2": 292.9, "r_y2": 453.3, "r_x3": 285.3, "r_y3": 453.3, "coord_origin": "TOPLEFT" }, "text": "0.25", "orig": "0.25", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 127, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 306.4, "r_y0": 456.1, "r_x1": 311.8, "r_y1": 456.1, "r_x2": 311.8, "r_y2": 453.3, "r_x3": 306.4, "r_y3": 453.3, "coord_origin": "TOPLEFT" }, "text": "0.5", "orig": "0.5", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 128, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 323.4, "r_y0": 456.1, "r_x1": 325.6, "r_y1": 456.1, "r_x2": 325.6, "r_y2": 453.3, "r_x3": 323.4, "r_y3": 453.3, "coord_origin": "TOPLEFT" }, "text": "1", "orig": "1", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 129, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 334.5, "r_y0": 456.1, "r_x1": 336.6, "r_y1": 456.1, "r_x2": 336.6, "r_y2": 453.3, "r_x3": 334.5, "r_y3": 453.3, "coord_origin": "TOPLEFT" }, "text": "2", "orig": "2", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 130, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 345.5, "r_y0": 456.1, "r_x1": 347.7, "r_y1": 456.1, "r_x2": 347.7, "r_y2": 453.3, "r_x3": 345.5, "r_y3": 453.3, "coord_origin": "TOPLEFT" }, "text": "4", "orig": "4", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 131, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 356.6, "r_y0": 456.1, "r_x1": 358.7, "r_y1": 456.1, "r_x2": 358.7, "r_y2": 453.3, "r_x3": 356.6, "r_y3": 453.3, "coord_origin": "TOPLEFT" }, "text": "8", "orig": "8", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 132, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 367.6, "r_y0": 456.1, "r_x1": 372.0, "r_y1": 456.1, "r_x2": 372.0, "r_y2": 453.3, "r_x3": 367.6, "r_y3": 453.3, "coord_origin": "TOPLEFT" }, "text": "16", "orig": "16", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 133, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 382.7, "r_y0": 456.1, "r_x1": 387.0, "r_y1": 456.1, "r_x2": 387.0, "r_y2": 453.3, "r_x3": 382.7, "r_y3": 453.3, "coord_origin": "TOPLEFT" }, "text": "32", "orig": "32", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 134, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 397.7, "r_y0": 456.1, "r_x1": 402.1, "r_y1": 456.1, "r_x2": 402.1, "r_y2": 453.3, "r_x3": 397.7, "r_y3": 453.3, "coord_origin": "TOPLEFT" }, "text": "64", "orig": "64", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 135, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 412.8, "r_y0": 457.8, "r_x1": 414.9, "r_y1": 457.8, "r_x2": 414.9, "r_y2": 448.0, "r_x3": 412.8, "r_y3": 448.0, "coord_origin": "TOPLEFT" }, "text": "\u2265", "orig": "\u2265", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 136, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 415.0, "r_y0": 456.1, "r_x1": 422.5, "r_y1": 456.1, "r_x2": 422.5, "r_y2": 453.3, "r_x3": 415.0, "r_y3": 453.3, "coord_origin": "TOPLEFT" }, "text": " 128", "orig": " 128", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 137, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 200.6, "r_y0": 466.7, "r_x1": 204.6, "r_y1": 466.7, "r_x2": 204.6, "r_y2": 463.9, "r_x3": 200.6, "r_y3": 463.9, "coord_origin": "TOPLEFT" }, "text": "63", "orig": "63", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 138, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 367.6, "r_y0": 466.7, "r_x1": 369.6, "r_y1": 466.7, "r_x2": 369.6, "r_y2": 463.9, "r_x3": 367.6, "r_y3": 463.9, "coord_origin": "TOPLEFT" }, "text": "1", "orig": "1", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 139, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 382.7, "r_y0": 466.7, "r_x1": 384.6, "r_y1": 466.7, "r_x2": 384.6, "r_y2": 463.9, "r_x3": 382.7, "r_y3": 463.9, "coord_origin": "TOPLEFT" }, "text": "1", "orig": "1", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 140, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 397.7, "r_y0": 466.7, "r_x1": 399.7, "r_y1": 466.7, "r_x2": 399.7, "r_y2": 463.9, "r_x3": 397.7, "r_y3": 463.9, "coord_origin": "TOPLEFT" }, "text": "3", "orig": "3", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 141, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 200.6, "r_y0": 471.5, "r_x1": 206.5, "r_y1": 471.5, "r_x2": 206.5, "r_y2": 468.8, "r_x3": 200.6, "r_y3": 468.8, "coord_origin": "TOPLEFT" }, "text": "199", "orig": "199", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 142, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 264.3, "r_y0": 471.5, "r_x1": 266.3, "r_y1": 471.5, "r_x2": 266.3, "r_y2": 468.8, "r_x3": 264.3, "r_y3": 468.8, "coord_origin": "TOPLEFT" }, "text": "5", "orig": "5", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 143, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 306.4, "r_y0": 471.5, "r_x1": 308.3, "r_y1": 471.5, "r_x2": 308.3, "r_y2": 468.8, "r_x3": 306.4, "r_y3": 468.8, "coord_origin": "TOPLEFT" }, "text": "1", "orig": "1", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 144, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 345.5, "r_y0": 471.5, "r_x1": 347.5, "r_y1": 471.5, "r_x2": 347.5, "r_y2": 468.8, "r_x3": 345.5, "r_y3": 468.8, "coord_origin": "TOPLEFT" }, "text": "2", "orig": "2", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 145, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 356.6, "r_y0": 471.5, "r_x1": 358.5, "r_y1": 471.5, "r_x2": 358.5, "r_y2": 468.8, "r_x3": 356.6, "r_y3": 468.8, "coord_origin": "TOPLEFT" }, "text": "4", "orig": "4", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 146, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 367.6, "r_y0": 471.5, "r_x1": 369.6, "r_y1": 471.5, "r_x2": 369.6, "r_y2": 468.8, "r_x3": 367.6, "r_y3": 468.8, "coord_origin": "TOPLEFT" }, "text": "1", "orig": "1", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 147, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 382.7, "r_y0": 471.5, "r_x1": 384.6, "r_y1": 471.5, "r_x2": 384.6, "r_y2": 468.8, "r_x3": 382.7, "r_y3": 468.8, "coord_origin": "TOPLEFT" }, "text": "1", "orig": "1", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 148, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 200.6, "r_y0": 476.4, "r_x1": 206.5, "r_y1": 476.4, "r_x2": 206.5, "r_y2": 473.7, "r_x3": 200.6, "r_y3": 473.7, "coord_origin": "TOPLEFT" }, "text": "416", "orig": "416", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 149, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 264.3, "r_y0": 476.4, "r_x1": 266.3, "r_y1": 476.4, "r_x2": 266.3, "r_y2": 473.7, "r_x3": 264.3, "r_y3": 473.7, "coord_origin": "TOPLEFT" }, "text": "4", "orig": "4", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 150, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 200.6, "r_y0": 481.3, "r_x1": 206.5, "r_y1": 481.3, "r_x2": 206.5, "r_y2": 478.5, "r_x3": 200.6, "r_y3": 478.5, "coord_origin": "TOPLEFT" }, "text": "230", "orig": "230", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 151, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 243.3, "r_y0": 481.3, "r_x1": 245.2, "r_y1": 481.3, "r_x2": 245.2, "r_y2": 478.5, "r_x3": 243.3, "r_y3": 478.5, "coord_origin": "TOPLEFT" }, "text": "1", "orig": "1", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 152, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 264.3, "r_y0": 481.3, "r_x1": 266.3, "r_y1": 481.3, "r_x2": 266.3, "r_y2": 478.5, "r_x3": 264.3, "r_y3": 478.5, "coord_origin": "TOPLEFT" }, "text": "9", "orig": "9", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 153, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 323.4, "r_y0": 481.3, "r_x1": 325.4, "r_y1": 481.3, "r_x2": 325.4, "r_y2": 478.5, "r_x3": 323.4, "r_y3": 478.5, "coord_origin": "TOPLEFT" }, "text": "1", "orig": "1", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 154, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 397.7, "r_y0": 481.3, "r_x1": 399.7, "r_y1": 481.3, "r_x2": 399.7, "r_y2": 478.5, "r_x3": 397.7, "r_y3": 478.5, "coord_origin": "TOPLEFT" }, "text": "1", "orig": "1", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 155, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 200.6, "r_y0": 486.1, "r_x1": 206.5, "r_y1": 486.1, "r_x2": 206.5, "r_y2": 483.4, "r_x3": 200.6, "r_y3": 483.4, "coord_origin": "TOPLEFT" }, "text": "276", "orig": "276", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 156, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 382.7, "r_y0": 486.1, "r_x1": 384.6, "r_y1": 486.1, "r_x2": 384.6, "r_y2": 483.4, "r_x3": 382.7, "r_y3": 483.4, "coord_origin": "TOPLEFT" }, "text": "2", "orig": "2", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 157, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 397.7, "r_y0": 486.1, "r_x1": 401.6, "r_y1": 486.1, "r_x2": 401.6, "r_y2": 483.4, "r_x3": 397.7, "r_y3": 483.4, "coord_origin": "TOPLEFT" }, "text": "12", "orig": "12", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 158, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 412.8, "r_y0": 486.1, "r_x1": 414.7, "r_y1": 486.1, "r_x2": 414.7, "r_y2": 483.4, "r_x3": 412.8, "r_y3": 483.4, "coord_origin": "TOPLEFT" }, "text": "1", "orig": "1", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 159, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 200.6, "r_y0": 491.0, "r_x1": 207.1, "r_y1": 491.0, "r_x2": 207.1, "r_y2": 488.3, "r_x3": 200.6, "r_y3": 488.3, "coord_origin": "TOPLEFT" }, "text": "320", "orig": "320", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 160, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 367.6, "r_y0": 491.0, "r_x1": 369.8, "r_y1": 491.0, "r_x2": 369.8, "r_y2": 488.3, "r_x3": 367.6, "r_y3": 488.3, "coord_origin": "TOPLEFT" }, "text": "1", "orig": "1", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 161, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 382.7, "r_y0": 491.0, "r_x1": 384.8, "r_y1": 491.0, "r_x2": 384.8, "r_y2": 488.3, "r_x3": 382.7, "r_y3": 488.3, "coord_origin": "TOPLEFT" }, "text": "4", "orig": "4", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 162, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 397.7, "r_y0": 491.0, "r_x1": 402.1, "r_y1": 491.0, "r_x2": 402.1, "r_y2": 488.3, "r_x3": 397.7, "r_y3": 488.3, "coord_origin": "TOPLEFT" }, "text": "20", "orig": "20", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 163, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 200.6, "r_y0": 495.9, "r_x1": 208.5, "r_y1": 495.9, "r_x2": 208.5, "r_y2": 493.2, "r_x3": 200.6, "r_y3": 493.2, "coord_origin": "TOPLEFT" }, "text": "2013", "orig": "2013", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 164, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 264.3, "r_y0": 495.9, "r_x1": 266.3, "r_y1": 495.9, "r_x2": 266.3, "r_y2": 493.2, "r_x3": 264.3, "r_y3": 493.2, "coord_origin": "TOPLEFT" }, "text": "3", "orig": "3", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [ { "id": 58, "label": "text", "bbox": { "l": 180.1, "t": 516.2, "r": 190.6, "b": 518.9, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 67, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 180.1, "r_y0": 518.9, "r_x1": 190.6, "r_y1": 518.9, "r_x2": 190.6, "r_y2": 516.2, "r_x3": 180.1, "r_y3": 516.2, "coord_origin": "TOPLEFT" }, "text": "", "orig": "
", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 59, "label": "text", "bbox": { "l": 183.2, "t": 520.1, "r": 304.5, "b": 522.8, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 68, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 183.2, "r_y0": 522.8, "r_x1": 304.5, "r_y1": 522.8, "r_x2": 304.5, "r_y2": 520.1, "r_x3": 183.2, "r_y3": 520.1, "coord_origin": "TOPLEFT" }, "text": "", "orig": "", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 60, "label": "text", "bbox": { "l": 183.2, "t": 524.0, "r": 388.4, "b": 526.7, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 69, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 183.2, "r_y0": 526.7, "r_x1": 388.4, "r_y1": 526.7, "r_x2": 388.4, "r_y2": 524.0, "r_x3": 183.2, "r_y3": 524.0, "coord_origin": "TOPLEFT" }, "text": "", "orig": "", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 61, "label": "text", "bbox": { "l": 183.2, "t": 527.9, "r": 388.4, "b": 530.6, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 70, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 183.2, "r_y0": 530.6, "r_x1": 388.4, "r_y1": 530.6, "r_x2": 388.4, "r_y2": 527.9, "r_x3": 183.2, "r_y3": 527.9, "coord_origin": "TOPLEFT" }, "text": "", "orig": "", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 62, "label": "text", "bbox": { "l": 183.2, "t": 531.8, "r": 388.4, "b": 534.5, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 71, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 183.2, "r_y0": 534.5, "r_x1": 388.4, "r_y1": 534.5, "r_x2": 388.4, "r_y2": 531.8, "r_x3": 183.2, "r_y3": 531.8, "coord_origin": "TOPLEFT" }, "text": "", "orig": "", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 63, "label": "text", "bbox": { "l": 183.2, "t": 535.7, "r": 388.4, "b": 538.4, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 72, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 183.2, "r_y0": 538.4, "r_x1": 388.4, "r_y1": 538.4, "r_x2": 388.4, "r_y2": 535.7, "r_x3": 183.2, "r_y3": 535.7, "coord_origin": "TOPLEFT" }, "text": "", "orig": "", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 64, "label": "text", "bbox": { "l": 183.2, "t": 539.6, "r": 388.4, "b": 542.3, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 73, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 183.2, "r_y0": 542.3, "r_x1": 388.4, "r_y1": 542.3, "r_x2": 388.4, "r_y2": 539.6, "r_x3": 183.2, "r_y3": 539.6, "coord_origin": "TOPLEFT" }, "text": "", "orig": "", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 65, "label": "text", "bbox": { "l": 183.2, "t": 543.5, "r": 388.4, "b": 546.2, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 74, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 183.2, "r_y0": 546.2, "r_x1": 388.4, "r_y1": 546.2, "r_x2": 388.4, "r_y2": 543.5, "r_x3": 183.2, "r_y3": 543.5, "coord_origin": "TOPLEFT" }, "text": "", "orig": "", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 66, "label": "text", "bbox": { "l": 183.2, "t": 547.4, "r": 388.4, "b": 550.1, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 75, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 183.2, "r_y0": 550.1, "r_x1": 388.4, "r_y1": 550.1, "r_x2": 388.4, "r_y2": 547.4, "r_x3": 183.2, "r_y3": 547.4, "coord_origin": "TOPLEFT" }, "text": "", "orig": "", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 67, "label": "text", "bbox": { "l": 183.2, "t": 551.3, "r": 388.4, "b": 554.0, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 76, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 183.2, "r_y0": 554.0, "r_x1": 388.4, "r_y1": 554.0, "r_x2": 388.4, "r_y2": 551.3, "r_x3": 183.2, "r_y3": 551.3, "coord_origin": "TOPLEFT" }, "text": "", "orig": "", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 68, "label": "text", "bbox": { "l": 180.1, "t": 555.2, "r": 191.9, "b": 557.9, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 77, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 180.1, "r_y0": 557.9, "r_x1": 191.9, "r_y1": 557.9, "r_x2": 191.9, "r_y2": 555.2, "r_x3": 180.1, "r_y3": 555.2, "coord_origin": "TOPLEFT" }, "text": "
", "orig": "", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 69, "label": "text", "bbox": { "l": 407.4, "t": 518.3, "r": 408.8, "b": 521.0, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 78, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 407.4, "r_y0": 521.0, "r_x1": 408.8, "r_y1": 521.0, "r_x2": 408.8, "r_y2": 518.3, "r_x3": 407.4, "r_y3": 518.3, "coord_origin": "TOPLEFT" }, "text": "C", "orig": "C", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 70, "label": "text", "bbox": { "l": 410.3, "t": 518.3, "r": 450.5, "b": 521.0, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 79, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 410.3, "r_y0": 521.0, "r_x1": 450.5, "r_y1": 521.0, "r_x2": 450.5, "r_y2": 518.3, "r_x3": 410.3, "r_y3": 518.3, "coord_origin": "TOPLEFT" }, "text": "C L L L C L L L L L C L L NL", "orig": "C L L L C L L L L L C L L NL", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 71, "label": "text", "bbox": { "l": 407.4, "t": 522.2, "r": 408.8, "b": 524.9, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 80, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 407.4, "r_y0": 524.9, "r_x1": 408.8, "r_y1": 524.9, "r_x2": 408.8, "r_y2": 522.2, "r_x3": 407.4, "r_y3": 522.2, "coord_origin": "TOPLEFT" }, "text": "C", "orig": "C", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 72, "label": "text", "bbox": { "l": 410.3, "t": 522.2, "r": 450.5, "b": 524.9, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 81, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 410.3, "r_y0": 524.9, "r_x1": 450.5, "r_y1": 524.9, "r_x2": 450.5, "r_y2": 522.2, "r_x3": 410.3, "r_y3": 522.2, "coord_origin": "TOPLEFT" }, "text": "C C C C C C C C C C C C C NL", "orig": "C C C C C C C C C C C C C NL", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 73, "label": "text", "bbox": { "l": 407.4, "t": 526.1, "r": 408.8, "b": 528.8, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 82, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 407.4, "r_y0": 528.8, "r_x1": 408.8, "r_y1": 528.8, "r_x2": 408.8, "r_y2": 526.1, "r_x3": 407.4, "r_y3": 526.1, "coord_origin": "TOPLEFT" }, "text": "C", "orig": "C", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 74, "label": "text", "bbox": { "l": 410.3, "t": 526.1, "r": 450.5, "b": 528.8, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 83, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 410.3, "r_y0": 528.8, "r_x1": 450.5, "r_y1": 528.8, "r_x2": 450.5, "r_y2": 526.1, "r_x3": 410.3, "r_y3": 526.1, "coord_origin": "TOPLEFT" }, "text": "C C C C C C C C C C C C C NL", "orig": "C C C C C C C C C C C C C NL", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 75, "label": "text", "bbox": { "l": 407.4, "t": 530.0, "r": 408.8, "b": 532.7, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 84, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 407.4, "r_y0": 532.7, "r_x1": 408.8, "r_y1": 532.7, "r_x2": 408.8, "r_y2": 530.0, "r_x3": 407.4, "r_y3": 530.0, "coord_origin": "TOPLEFT" }, "text": "C", "orig": "C", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 76, "label": "text", "bbox": { "l": 410.3, "t": 530.0, "r": 450.5, "b": 532.7, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 85, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 410.3, "r_y0": 532.7, "r_x1": 450.5, "r_y1": 532.7, "r_x2": 450.5, "r_y2": 530.0, "r_x3": 410.3, "r_y3": 530.0, "coord_origin": "TOPLEFT" }, "text": "C C C C C C C C C C C C C NL", "orig": "C C C C C C C C C C C C C NL", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 77, "label": "text", "bbox": { "l": 407.4, "t": 533.9, "r": 408.8, "b": 536.6, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 86, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 407.4, "r_y0": 536.6, "r_x1": 408.8, "r_y1": 536.6, "r_x2": 408.8, "r_y2": 533.9, "r_x3": 407.4, "r_y3": 533.9, "coord_origin": "TOPLEFT" }, "text": "C", "orig": "C", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 78, "label": "text", "bbox": { "l": 410.3, "t": 533.9, "r": 450.5, "b": 536.6, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 87, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 410.3, "r_y0": 536.6, "r_x1": 450.5, "r_y1": 536.6, "r_x2": 450.5, "r_y2": 533.9, "r_x3": 410.3, "r_y3": 533.9, "coord_origin": "TOPLEFT" }, "text": "C C C C C C C C C C C C C NL", "orig": "C C C C C C C C C C C C C NL", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 79, "label": "text", "bbox": { "l": 407.4, "t": 537.8, "r": 408.8, "b": 540.5, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 88, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 407.4, "r_y0": 540.5, "r_x1": 408.8, "r_y1": 540.5, "r_x2": 408.8, "r_y2": 537.8, "r_x3": 407.4, "r_y3": 537.8, "coord_origin": "TOPLEFT" }, "text": "C", "orig": "C", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 80, "label": "text", "bbox": { "l": 410.3, "t": 537.8, "r": 450.5, "b": 540.5, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 89, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 410.3, "r_y0": 540.5, "r_x1": 450.5, "r_y1": 540.5, "r_x2": 450.5, "r_y2": 537.8, "r_x3": 410.3, "r_y3": 537.8, "coord_origin": "TOPLEFT" }, "text": "C C C C C C C C C C C C C NL", "orig": "C C C C C C C C C C C C C NL", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 81, "label": "text", "bbox": { "l": 407.4, "t": 541.7, "r": 408.8, "b": 544.4, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 90, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 407.4, "r_y0": 544.4, "r_x1": 408.8, "r_y1": 544.4, "r_x2": 408.8, "r_y2": 541.7, "r_x3": 407.4, "r_y3": 541.7, "coord_origin": "TOPLEFT" }, "text": "C", "orig": "C", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 82, "label": "text", "bbox": { "l": 410.3, "t": 541.7, "r": 450.5, "b": 544.4, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 91, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 410.3, "r_y0": 544.4, "r_x1": 450.5, "r_y1": 544.4, "r_x2": 450.5, "r_y2": 541.7, "r_x3": 410.3, "r_y3": 541.7, "coord_origin": "TOPLEFT" }, "text": "C C C C C C C C C C C C C NL", "orig": "C C C C C C C C C C C C C NL", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 83, "label": "text", "bbox": { "l": 407.4, "t": 545.6, "r": 408.8, "b": 548.3, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 92, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 407.4, "r_y0": 548.3, "r_x1": 408.8, "r_y1": 548.3, "r_x2": 408.8, "r_y2": 545.6, "r_x3": 407.4, "r_y3": 545.6, "coord_origin": "TOPLEFT" }, "text": "C", "orig": "C", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 84, "label": "text", "bbox": { "l": 410.3, "t": 545.6, "r": 450.5, "b": 548.3, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 93, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 410.3, "r_y0": 548.3, "r_x1": 450.5, "r_y1": 548.3, "r_x2": 450.5, "r_y2": 545.6, "r_x3": 410.3, "r_y3": 545.6, "coord_origin": "TOPLEFT" }, "text": "C C C C C C C C C C C C C NL", "orig": "C C C C C C C C C C C C C NL", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 85, "label": "text", "bbox": { "l": 407.4, "t": 549.5, "r": 408.8, "b": 552.2, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 94, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 407.4, "r_y0": 552.2, "r_x1": 408.8, "r_y1": 552.2, "r_x2": 408.8, "r_y2": 549.5, "r_x3": 407.4, "r_y3": 549.5, "coord_origin": "TOPLEFT" }, "text": "C", "orig": "C", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 86, "label": "text", "bbox": { "l": 410.3, "t": 549.5, "r": 450.5, "b": 552.2, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 95, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 410.3, "r_y0": 552.2, "r_x1": 450.5, "r_y1": 552.2, "r_x2": 450.5, "r_y2": 549.5, "r_x3": 410.3, "r_y3": 549.5, "coord_origin": "TOPLEFT" }, "text": "C C C C C C C C C C C C C NL", "orig": "C C C C C C C C C C C C C NL", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 87, "label": "text", "bbox": { "l": 164.5, "t": 509.5, "r": 181.9, "b": 515.3, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 96, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 164.5, "r_y0": 515.3, "r_x1": 181.9, "r_y1": 515.3, "r_x2": 181.9, "r_y2": 509.5, "r_x3": 164.5, "r_y3": 509.5, "coord_origin": "TOPLEFT" }, "text": "HTML", "orig": "HTML", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 88, "label": "text", "bbox": { "l": 183.6, "t": 509.5, "r": 186.4, "b": 515.3, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 97, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 183.6, "r_y0": 515.3, "r_x1": 186.4, "r_y1": 515.3, "r_x2": 186.4, "r_y2": 509.5, "r_x3": 183.6, "r_y3": 509.5, "coord_origin": "TOPLEFT" }, "text": "#", "orig": "#", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 89, "label": "text", "bbox": { "l": 189.2, "t": 509.5, "r": 208.9, "b": 515.3, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 98, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 189.2, "r_y0": 515.3, "r_x1": 208.9, "r_y1": 515.3, "r_x2": 208.9, "r_y2": 509.5, "r_x3": 189.2, "r_y3": 509.5, "coord_origin": "TOPLEFT" }, "text": "tokens:", "orig": "tokens:", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 90, "label": "text", "bbox": { "l": 210.6, "t": 509.5, "r": 221.0, "b": 515.3, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 99, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 210.6, "r_y0": 515.3, "r_x1": 221.0, "r_y1": 515.3, "r_x2": 221.0, "r_y2": 509.5, "r_x3": 210.6, "r_y3": 509.5, "coord_origin": "TOPLEFT" }, "text": "258", "orig": "258", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 91, "label": "text", "bbox": { "l": 390.2, "t": 509.6, "r": 406.8, "b": 515.5, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 100, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 390.2, "r_y0": 515.5, "r_x1": 406.8, "r_y1": 515.5, "r_x2": 406.8, "r_y2": 509.6, "r_x3": 390.2, "r_y3": 509.6, "coord_origin": "TOPLEFT" }, "text": "OTSL", "orig": "OTSL", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 92, "label": "text", "bbox": { "l": 408.6, "t": 509.6, "r": 411.4, "b": 515.5, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 101, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 408.6, "r_y0": 515.5, "r_x1": 411.4, "r_y1": 515.5, "r_x2": 411.4, "r_y2": 509.6, "r_x3": 408.6, "r_y3": 509.6, "coord_origin": "TOPLEFT" }, "text": "#", "orig": "#", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 93, "label": "text", "bbox": { "l": 414.2, "t": 509.6, "r": 433.9, "b": 515.5, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 102, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 414.2, "r_y0": 515.5, "r_x1": 433.9, "r_y1": 515.5, "r_x2": 433.9, "r_y2": 509.6, "r_x3": 414.2, "r_y3": 509.6, "coord_origin": "TOPLEFT" }, "text": "tokens:", "orig": "tokens:", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 94, "label": "text", "bbox": { "l": 435.6, "t": 509.6, "r": 446.0, "b": 515.5, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 103, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 435.6, "r_y0": 515.5, "r_x1": 446.0, "r_y1": 515.5, "r_x2": 446.0, "r_y2": 509.6, "r_x3": 435.6, "r_y3": 509.6, "coord_origin": "TOPLEFT" }, "text": "135", "orig": "135", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 95, "label": "text", "bbox": { "l": 167.2, "t": 519.1, "r": 172.8, "b": 526.4, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 104, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 167.2, "r_y0": 526.4, "r_x1": 172.8, "r_y1": 526.4, "r_x2": 172.8, "r_y2": 519.1, "r_x3": 167.2, "r_y3": 519.1, "coord_origin": "TOPLEFT" }, "text": "B", "orig": "B", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 96, "label": "text", "bbox": { "l": 187.3, "t": 448.6, "r": 193.0, "b": 455.9, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 105, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 187.3, "r_y0": 455.9, "r_x1": 193.0, "r_y1": 455.9, "r_x2": 193.0, "r_y2": 448.6, "r_x3": 187.3, "r_y3": 448.6, "coord_origin": "TOPLEFT" }, "text": "A", "orig": "A", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 97, "label": "text", "bbox": { "l": 167.4, "t": 566.0, "r": 173.0, "b": 573.3, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 106, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 167.4, "r_y0": 573.3, "r_x1": 173.0, "r_y1": 573.3, "r_x2": 173.0, "r_y2": 566.0, "r_x3": 167.4, "r_y3": 566.0, "coord_origin": "TOPLEFT" }, "text": "D", "orig": "D", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 98, "label": "text", "bbox": { "l": 248.5, "t": 621.8, "r": 253.7, "b": 629.1, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 107, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 248.5, "r_y0": 629.1, "r_x1": 253.7, "r_y1": 629.1, "r_x2": 253.7, "r_y2": 621.8, "r_x3": 248.5, "r_y3": 621.8, "coord_origin": "TOPLEFT" }, "text": "E", "orig": "E", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 99, "label": "text", "bbox": { "l": 395.9, "t": 519.2, "r": 401.5, "b": 526.5, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 108, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 395.9, "r_y0": 526.5, "r_x1": 401.5, "r_y1": 526.5, "r_x2": 401.5, "r_y2": 519.2, "r_x3": 395.9, "r_y3": 519.2, "coord_origin": "TOPLEFT" }, "text": "C", "orig": "C", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 100, "label": "text", "bbox": { "l": 171.6, "t": 580.3, "r": 177.5, "b": 597.3, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 109, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 171.6, "r_y0": 597.3, "r_x1": 177.5, "r_y1": 597.3, "r_x2": 177.5, "r_y2": 580.3, "r_x3": 171.6, "r_y3": 580.3, "coord_origin": "TOPLEFT" }, "text": "HTML", "orig": "HTML", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 101, "label": "text", "bbox": { "l": 251.1, "t": 633.6, "r": 256.9, "b": 649.9, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 110, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 251.1, "r_y0": 649.9, "r_x1": 256.9, "r_y1": 649.9, "r_x2": 256.9, "r_y2": 633.6, "r_x3": 251.1, "r_y3": 633.6, "coord_origin": "TOPLEFT" }, "text": "OTSL", "orig": "OTSL", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 102, "label": "text", "bbox": { "l": 372.1, "t": 601.5, "r": 427.0, "b": 607.3, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 111, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 372.1, "r_y0": 607.3, "r_x1": 427.0, "r_y1": 607.3, "r_x2": 427.0, "r_y2": 601.5, "r_x3": 372.1, "r_y3": 601.5, "coord_origin": "TOPLEFT" }, "text": "HTML model shows", "orig": "HTML model shows", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 103, "label": "text", "bbox": { "l": 372.1, "t": 607.9, "r": 430.1, "b": 613.8, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 112, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 372.1, "r_y0": 613.8, "r_x1": 430.1, "r_y1": 613.8, "r_x2": 430.1, "r_y2": 607.9, "r_x3": 372.1, "r_y3": 607.9, "coord_origin": "TOPLEFT" }, "text": "bounding box drifting", "orig": "bounding box drifting", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 104, "label": "text", "bbox": { "l": 176.9, "t": 642.9, "r": 231.1, "b": 648.7, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 113, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 176.9, "r_y0": 648.7, "r_x1": 231.1, "r_y1": 648.7, "r_x2": 231.1, "r_y2": 642.9, "r_x3": 176.9, "r_y3": 642.9, "coord_origin": "TOPLEFT" }, "text": "OTSL model shows", "orig": "OTSL model shows", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 105, "label": "text", "bbox": { "l": 176.9, "t": 649.3, "r": 231.0, "b": 655.2, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 114, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 176.9, "r_y0": 655.2, "r_x1": 231.0, "r_y1": 655.2, "r_x2": 231.0, "r_y2": 649.3, "r_x3": 176.9, "r_y3": 649.3, "coord_origin": "TOPLEFT" }, "text": "clean bounding box", "orig": "clean bounding box", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 106, "label": "text", "bbox": { "l": 176.9, "t": 655.8, "r": 203.9, "b": 661.6, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 115, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 176.9, "r_y0": 661.6, "r_x1": 203.9, "r_y1": 661.6, "r_x2": 203.9, "r_y2": 655.8, "r_x3": 176.9, "r_y3": 655.8, "coord_origin": "TOPLEFT" }, "text": "alignment", "orig": "alignment", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 107, "label": "text", "bbox": { "l": 215.9, "t": 557.6, "r": 218.5, "b": 569.2, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 116, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 215.9, "r_y0": 569.2, "r_x1": 218.5, "r_y1": 569.2, "r_x2": 218.5, "r_y2": 557.6, "r_x3": 215.9, "r_y3": 557.6, "coord_origin": "TOPLEFT" }, "text": "\u2264", "orig": "\u2264", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 108, "label": "text", "bbox": { "l": 229.1, "t": 557.6, "r": 231.7, "b": 569.2, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 117, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 229.1, "r_y0": 569.2, "r_x1": 231.7, "r_y1": 569.2, "r_x2": 231.7, "r_y2": 557.6, "r_x3": 229.1, "r_y3": 557.6, "coord_origin": "TOPLEFT" }, "text": "\u03bc", "orig": "\u03bc", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 109, "label": "text", "bbox": { "l": 261.2, "t": 448.5, "r": 263.6, "b": 451.2, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 119, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 261.2, "r_y0": 451.2, "r_x1": 263.6, "r_y1": 451.2, "r_x2": 263.6, "r_y2": 448.5, "r_x3": 261.2, "r_y3": 448.5, "coord_origin": "TOPLEFT" }, "text": "S", "orig": "S", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 110, "label": "text", "bbox": { "l": 312.3, "t": 448.5, "r": 313.6, "b": 451.2, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 120, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 312.3, "r_y0": 451.2, "r_x1": 313.6, "r_y1": 451.2, "r_x2": 313.6, "r_y2": 448.5, "r_x3": 312.3, "r_y3": 448.5, "coord_origin": "TOPLEFT" }, "text": "I", "orig": "I", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 111, "label": "text", "bbox": { "l": 377.4, "t": 448.5, "r": 380.1, "b": 451.2, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 121, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 377.4, "r_y0": 451.2, "r_x1": 380.1, "r_y1": 451.2, "r_x2": 380.1, "r_y2": 448.5, "r_x3": 377.4, "r_y3": 448.5, "coord_origin": "TOPLEFT" }, "text": "R", "orig": "R", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 112, "label": "text", "bbox": { "l": 200.6, "t": 453.3, "r": 205.8, "b": 456.1, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 122, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 200.6, "r_y0": 456.1, "r_x1": 205.8, "r_y1": 456.1, "r_x2": 205.8, "r_y2": 453.3, "r_x3": 200.6, "r_y3": 453.3, "coord_origin": "TOPLEFT" }, "text": "ST", "orig": "ST", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 113, "label": "text", "bbox": { "l": 222.2, "t": 453.3, "r": 229.8, "b": 456.1, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 123, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 222.2, "r_y0": 456.1, "r_x1": 229.8, "r_y1": 456.1, "r_x2": 229.8, "r_y2": 453.3, "r_x3": 222.2, "r_y3": 453.3, "coord_origin": "TOPLEFT" }, "text": "0.03", "orig": "0.03", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 114, "label": "text", "bbox": { "l": 243.3, "t": 453.3, "r": 250.8, "b": 456.1, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 124, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 243.3, "r_y0": 456.1, "r_x1": 250.8, "r_y1": 456.1, "r_x2": 250.8, "r_y2": 453.3, "r_x3": 243.3, "r_y3": 453.3, "coord_origin": "TOPLEFT" }, "text": "0.06", "orig": "0.06", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 115, "label": "text", "bbox": { "l": 264.3, "t": 453.3, "r": 271.8, "b": 456.1, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 125, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 264.3, "r_y0": 456.1, "r_x1": 271.8, "r_y1": 456.1, "r_x2": 271.8, "r_y2": 453.3, "r_x3": 264.3, "r_y3": 453.3, "coord_origin": "TOPLEFT" }, "text": "0.12", "orig": "0.12", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 116, "label": "text", "bbox": { "l": 285.3, "t": 453.3, "r": 292.9, "b": 456.1, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 126, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 285.3, "r_y0": 456.1, "r_x1": 292.9, "r_y1": 456.1, "r_x2": 292.9, "r_y2": 453.3, "r_x3": 285.3, "r_y3": 453.3, "coord_origin": "TOPLEFT" }, "text": "0.25", "orig": "0.25", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 117, "label": "text", "bbox": { "l": 306.4, "t": 453.3, "r": 311.8, "b": 456.1, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 127, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 306.4, "r_y0": 456.1, "r_x1": 311.8, "r_y1": 456.1, "r_x2": 311.8, "r_y2": 453.3, "r_x3": 306.4, "r_y3": 453.3, "coord_origin": "TOPLEFT" }, "text": "0.5", "orig": "0.5", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 118, "label": "text", "bbox": { "l": 323.4, "t": 453.3, "r": 325.6, "b": 456.1, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 128, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 323.4, "r_y0": 456.1, "r_x1": 325.6, "r_y1": 456.1, "r_x2": 325.6, "r_y2": 453.3, "r_x3": 323.4, "r_y3": 453.3, "coord_origin": "TOPLEFT" }, "text": "1", "orig": "1", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 119, "label": "text", "bbox": { "l": 334.5, "t": 453.3, "r": 336.6, "b": 456.1, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 129, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 334.5, "r_y0": 456.1, "r_x1": 336.6, "r_y1": 456.1, "r_x2": 336.6, "r_y2": 453.3, "r_x3": 334.5, "r_y3": 453.3, "coord_origin": "TOPLEFT" }, "text": "2", "orig": "2", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 120, "label": "text", "bbox": { "l": 345.5, "t": 453.3, "r": 347.7, "b": 456.1, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 130, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 345.5, "r_y0": 456.1, "r_x1": 347.7, "r_y1": 456.1, "r_x2": 347.7, "r_y2": 453.3, "r_x3": 345.5, "r_y3": 453.3, "coord_origin": "TOPLEFT" }, "text": "4", "orig": "4", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 121, "label": "text", "bbox": { "l": 356.6, "t": 453.3, "r": 358.7, "b": 456.1, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 131, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 356.6, "r_y0": 456.1, "r_x1": 358.7, "r_y1": 456.1, "r_x2": 358.7, "r_y2": 453.3, "r_x3": 356.6, "r_y3": 453.3, "coord_origin": "TOPLEFT" }, "text": "8", "orig": "8", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 122, "label": "text", "bbox": { "l": 367.6, "t": 453.3, "r": 372.0, "b": 456.1, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 132, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 367.6, "r_y0": 456.1, "r_x1": 372.0, "r_y1": 456.1, "r_x2": 372.0, "r_y2": 453.3, "r_x3": 367.6, "r_y3": 453.3, "coord_origin": "TOPLEFT" }, "text": "16", "orig": "16", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 123, "label": "text", "bbox": { "l": 382.7, "t": 453.3, "r": 387.0, "b": 456.1, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 133, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 382.7, "r_y0": 456.1, "r_x1": 387.0, "r_y1": 456.1, "r_x2": 387.0, "r_y2": 453.3, "r_x3": 382.7, "r_y3": 453.3, "coord_origin": "TOPLEFT" }, "text": "32", "orig": "32", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 124, "label": "text", "bbox": { "l": 397.7, "t": 453.3, "r": 402.1, "b": 456.1, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 134, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 397.7, "r_y0": 456.1, "r_x1": 402.1, "r_y1": 456.1, "r_x2": 402.1, "r_y2": 453.3, "r_x3": 397.7, "r_y3": 453.3, "coord_origin": "TOPLEFT" }, "text": "64", "orig": "64", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 125, "label": "text", "bbox": { "l": 412.8, "t": 448.0, "r": 414.9, "b": 457.8, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 135, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 412.8, "r_y0": 457.8, "r_x1": 414.9, "r_y1": 457.8, "r_x2": 414.9, "r_y2": 448.0, "r_x3": 412.8, "r_y3": 448.0, "coord_origin": "TOPLEFT" }, "text": "\u2265", "orig": "\u2265", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 126, "label": "text", "bbox": { "l": 415.0, "t": 453.3, "r": 422.5, "b": 456.1, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 136, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 415.0, "r_y0": 456.1, "r_x1": 422.5, "r_y1": 456.1, "r_x2": 422.5, "r_y2": 453.3, "r_x3": 415.0, "r_y3": 453.3, "coord_origin": "TOPLEFT" }, "text": " 128", "orig": " 128", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 127, "label": "text", "bbox": { "l": 200.6, "t": 463.9, "r": 204.6, "b": 466.7, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 137, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 200.6, "r_y0": 466.7, "r_x1": 204.6, "r_y1": 466.7, "r_x2": 204.6, "r_y2": 463.9, "r_x3": 200.6, "r_y3": 463.9, "coord_origin": "TOPLEFT" }, "text": "63", "orig": "63", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 128, "label": "text", "bbox": { "l": 367.6, "t": 463.9, "r": 369.6, "b": 466.7, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 138, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 367.6, "r_y0": 466.7, "r_x1": 369.6, "r_y1": 466.7, "r_x2": 369.6, "r_y2": 463.9, "r_x3": 367.6, "r_y3": 463.9, "coord_origin": "TOPLEFT" }, "text": "1", "orig": "1", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 129, "label": "text", "bbox": { "l": 382.7, "t": 463.9, "r": 384.6, "b": 466.7, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 139, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 382.7, "r_y0": 466.7, "r_x1": 384.6, "r_y1": 466.7, "r_x2": 384.6, "r_y2": 463.9, "r_x3": 382.7, "r_y3": 463.9, "coord_origin": "TOPLEFT" }, "text": "1", "orig": "1", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 130, "label": "text", "bbox": { "l": 397.7, "t": 463.9, "r": 399.7, "b": 466.7, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 140, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 397.7, "r_y0": 466.7, "r_x1": 399.7, "r_y1": 466.7, "r_x2": 399.7, "r_y2": 463.9, "r_x3": 397.7, "r_y3": 463.9, "coord_origin": "TOPLEFT" }, "text": "3", "orig": "3", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 131, "label": "text", "bbox": { "l": 200.6, "t": 468.8, "r": 206.5, "b": 471.5, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 141, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 200.6, "r_y0": 471.5, "r_x1": 206.5, "r_y1": 471.5, "r_x2": 206.5, "r_y2": 468.8, "r_x3": 200.6, "r_y3": 468.8, "coord_origin": "TOPLEFT" }, "text": "199", "orig": "199", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 132, "label": "text", "bbox": { "l": 264.3, "t": 468.8, "r": 266.3, "b": 471.5, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 142, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 264.3, "r_y0": 471.5, "r_x1": 266.3, "r_y1": 471.5, "r_x2": 266.3, "r_y2": 468.8, "r_x3": 264.3, "r_y3": 468.8, "coord_origin": "TOPLEFT" }, "text": "5", "orig": "5", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 133, "label": "text", "bbox": { "l": 306.4, "t": 468.8, "r": 308.3, "b": 471.5, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 143, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 306.4, "r_y0": 471.5, "r_x1": 308.3, "r_y1": 471.5, "r_x2": 308.3, "r_y2": 468.8, "r_x3": 306.4, "r_y3": 468.8, "coord_origin": "TOPLEFT" }, "text": "1", "orig": "1", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 134, "label": "text", "bbox": { "l": 345.5, "t": 468.8, "r": 347.5, "b": 471.5, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 144, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 345.5, "r_y0": 471.5, "r_x1": 347.5, "r_y1": 471.5, "r_x2": 347.5, "r_y2": 468.8, "r_x3": 345.5, "r_y3": 468.8, "coord_origin": "TOPLEFT" }, "text": "2", "orig": "2", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 135, "label": "text", "bbox": { "l": 356.6, "t": 468.8, "r": 358.5, "b": 471.5, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 145, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 356.6, "r_y0": 471.5, "r_x1": 358.5, "r_y1": 471.5, "r_x2": 358.5, "r_y2": 468.8, "r_x3": 356.6, "r_y3": 468.8, "coord_origin": "TOPLEFT" }, "text": "4", "orig": "4", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 136, "label": "text", "bbox": { "l": 367.6, "t": 468.8, "r": 369.6, "b": 471.5, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 146, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 367.6, "r_y0": 471.5, "r_x1": 369.6, "r_y1": 471.5, "r_x2": 369.6, "r_y2": 468.8, "r_x3": 367.6, "r_y3": 468.8, "coord_origin": "TOPLEFT" }, "text": "1", "orig": "1", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 137, "label": "text", "bbox": { "l": 382.7, "t": 468.8, "r": 384.6, "b": 471.5, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 147, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 382.7, "r_y0": 471.5, "r_x1": 384.6, "r_y1": 471.5, "r_x2": 384.6, "r_y2": 468.8, "r_x3": 382.7, "r_y3": 468.8, "coord_origin": "TOPLEFT" }, "text": "1", "orig": "1", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 138, "label": "text", "bbox": { "l": 200.6, "t": 473.7, "r": 206.5, "b": 476.4, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 148, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 200.6, "r_y0": 476.4, "r_x1": 206.5, "r_y1": 476.4, "r_x2": 206.5, "r_y2": 473.7, "r_x3": 200.6, "r_y3": 473.7, "coord_origin": "TOPLEFT" }, "text": "416", "orig": "416", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 139, "label": "text", "bbox": { "l": 264.3, "t": 473.7, "r": 266.3, "b": 476.4, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 149, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 264.3, "r_y0": 476.4, "r_x1": 266.3, "r_y1": 476.4, "r_x2": 266.3, "r_y2": 473.7, "r_x3": 264.3, "r_y3": 473.7, "coord_origin": "TOPLEFT" }, "text": "4", "orig": "4", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 140, "label": "text", "bbox": { "l": 200.6, "t": 478.5, "r": 206.5, "b": 481.3, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 150, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 200.6, "r_y0": 481.3, "r_x1": 206.5, "r_y1": 481.3, "r_x2": 206.5, "r_y2": 478.5, "r_x3": 200.6, "r_y3": 478.5, "coord_origin": "TOPLEFT" }, "text": "230", "orig": "230", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 141, "label": "text", "bbox": { "l": 243.3, "t": 478.5, "r": 245.2, "b": 481.3, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 151, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 243.3, "r_y0": 481.3, "r_x1": 245.2, "r_y1": 481.3, "r_x2": 245.2, "r_y2": 478.5, "r_x3": 243.3, "r_y3": 478.5, "coord_origin": "TOPLEFT" }, "text": "1", "orig": "1", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 142, "label": "text", "bbox": { "l": 264.3, "t": 478.5, "r": 266.3, "b": 481.3, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 152, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 264.3, "r_y0": 481.3, "r_x1": 266.3, "r_y1": 481.3, "r_x2": 266.3, "r_y2": 478.5, "r_x3": 264.3, "r_y3": 478.5, "coord_origin": "TOPLEFT" }, "text": "9", "orig": "9", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 143, "label": "text", "bbox": { "l": 323.4, "t": 478.5, "r": 325.4, "b": 481.3, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 153, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 323.4, "r_y0": 481.3, "r_x1": 325.4, "r_y1": 481.3, "r_x2": 325.4, "r_y2": 478.5, "r_x3": 323.4, "r_y3": 478.5, "coord_origin": "TOPLEFT" }, "text": "1", "orig": "1", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 144, "label": "text", "bbox": { "l": 397.7, "t": 478.5, "r": 399.7, "b": 481.3, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 154, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 397.7, "r_y0": 481.3, "r_x1": 399.7, "r_y1": 481.3, "r_x2": 399.7, "r_y2": 478.5, "r_x3": 397.7, "r_y3": 478.5, "coord_origin": "TOPLEFT" }, "text": "1", "orig": "1", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 145, "label": "text", "bbox": { "l": 200.6, "t": 483.4, "r": 206.5, "b": 486.1, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 155, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 200.6, "r_y0": 486.1, "r_x1": 206.5, "r_y1": 486.1, "r_x2": 206.5, "r_y2": 483.4, "r_x3": 200.6, "r_y3": 483.4, "coord_origin": "TOPLEFT" }, "text": "276", "orig": "276", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 146, "label": "text", "bbox": { "l": 382.7, "t": 483.4, "r": 384.6, "b": 486.1, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 156, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 382.7, "r_y0": 486.1, "r_x1": 384.6, "r_y1": 486.1, "r_x2": 384.6, "r_y2": 483.4, "r_x3": 382.7, "r_y3": 483.4, "coord_origin": "TOPLEFT" }, "text": "2", "orig": "2", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 147, "label": "text", "bbox": { "l": 397.7, "t": 483.4, "r": 401.6, "b": 486.1, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 157, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 397.7, "r_y0": 486.1, "r_x1": 401.6, "r_y1": 486.1, "r_x2": 401.6, "r_y2": 483.4, "r_x3": 397.7, "r_y3": 483.4, "coord_origin": "TOPLEFT" }, "text": "12", "orig": "12", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 148, "label": "text", "bbox": { "l": 412.8, "t": 483.4, "r": 414.7, "b": 486.1, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 158, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 412.8, "r_y0": 486.1, "r_x1": 414.7, "r_y1": 486.1, "r_x2": 414.7, "r_y2": 483.4, "r_x3": 412.8, "r_y3": 483.4, "coord_origin": "TOPLEFT" }, "text": "1", "orig": "1", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 149, "label": "text", "bbox": { "l": 200.6, "t": 488.3, "r": 207.1, "b": 491.0, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 159, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 200.6, "r_y0": 491.0, "r_x1": 207.1, "r_y1": 491.0, "r_x2": 207.1, "r_y2": 488.3, "r_x3": 200.6, "r_y3": 488.3, "coord_origin": "TOPLEFT" }, "text": "320", "orig": "320", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 150, "label": "text", "bbox": { "l": 367.6, "t": 488.3, "r": 369.8, "b": 491.0, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 160, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 367.6, "r_y0": 491.0, "r_x1": 369.8, "r_y1": 491.0, "r_x2": 369.8, "r_y2": 488.3, "r_x3": 367.6, "r_y3": 488.3, "coord_origin": "TOPLEFT" }, "text": "1", "orig": "1", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 151, "label": "text", "bbox": { "l": 382.7, "t": 488.3, "r": 384.8, "b": 491.0, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 161, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 382.7, "r_y0": 491.0, "r_x1": 384.8, "r_y1": 491.0, "r_x2": 384.8, "r_y2": 488.3, "r_x3": 382.7, "r_y3": 488.3, "coord_origin": "TOPLEFT" }, "text": "4", "orig": "4", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 152, "label": "text", "bbox": { "l": 397.7, "t": 488.3, "r": 402.1, "b": 491.0, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 162, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 397.7, "r_y0": 491.0, "r_x1": 402.1, "r_y1": 491.0, "r_x2": 402.1, "r_y2": 488.3, "r_x3": 397.7, "r_y3": 488.3, "coord_origin": "TOPLEFT" }, "text": "20", "orig": "20", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 153, "label": "text", "bbox": { "l": 200.6, "t": 493.2, "r": 208.5, "b": 495.9, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 163, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 200.6, "r_y0": 495.9, "r_x1": 208.5, "r_y1": 495.9, "r_x2": 208.5, "r_y2": 493.2, "r_x3": 200.6, "r_y3": 493.2, "coord_origin": "TOPLEFT" }, "text": "2013", "orig": "2013", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 154, "label": "text", "bbox": { "l": 264.3, "t": 493.2, "r": 266.3, "b": 495.9, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 164, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 264.3, "r_y0": 495.9, "r_x1": 266.3, "r_y1": 495.9, "r_x2": 266.3, "r_y2": 493.2, "r_x3": 264.3, "r_y3": 493.2, "coord_origin": "TOPLEFT" }, "text": "3", "orig": "3", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] } ] }, { "id": 155, "label": "text", "bbox": { "l": 227.9, "t": 665.8, "r": 230.1, "b": 675.3, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 165, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 227.9, "r_y0": 675.3, "r_x1": 230.1, "r_y1": 675.3, "r_x2": 230.1, "r_y2": 665.8, "r_x3": 227.9, "r_y3": 665.8, "coord_origin": "TOPLEFT" }, "text": "\u03bc", "orig": "\u03bc", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 156, "label": "text", "bbox": { "l": 300.6, "t": 683.6, "r": 302.7, "b": 693.4, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 166, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 300.6, "r_y0": 693.4, "r_x1": 302.7, "r_y1": 693.4, "r_x2": 302.7, "r_y2": 683.6, "r_x3": 300.6, "r_y3": 683.6, "coord_origin": "TOPLEFT" }, "text": "\u2265", "orig": "\u2265", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] } ] }, "tablestructure": { "table_map": { "0": { "label": "table", "id": 0, "page_no": 9, "cluster": { "id": 0, "label": "table", "bbox": { "l": 143.6, "t": 156.3, "r": 470.8, "b": 263.3, "coord_origin": "TOPLEFT" }, "confidence": 0.99, "cells": [ { "index": 7, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 160.8, "r_y0": 174.6, "r_x1": 195.0, "r_y1": 174.6, "r_x2": 195.0, "r_y2": 166.6, "r_x3": 160.8, "r_y3": 166.6, "coord_origin": "TOPLEFT" }, "text": "Data set", "orig": "Data set", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 8, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 215.5, "r_y0": 174.6, "r_x1": 254.0, "r_y1": 174.6, "r_x2": 254.0, "r_y2": 166.5, "r_x3": 215.5, "r_y3": 166.5, "coord_origin": "TOPLEFT" }, "text": "Language", "orig": "Language", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 9, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 300.4, "r_y0": 169.1, "r_x1": 324.0, "r_y1": 169.1, "r_x2": 324.0, "r_y2": 161.1, "r_x3": 300.4, "r_y3": 161.1, "coord_origin": "TOPLEFT" }, "text": "TEDs", "orig": "TEDs", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 10, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 370.3, "r_y0": 174.6, "r_x1": 414.7, "r_y1": 174.6, "r_x2": 414.7, "r_y2": 166.6, "r_x3": 370.3, "r_y3": 166.6, "coord_origin": "TOPLEFT" }, "text": "mAP(0.75)", "orig": "mAP(0.75)", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 11, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 426.7, "r_y0": 169.1, "r_x1": 463.1, "r_y1": 169.1, "r_x2": 463.1, "r_y2": 161.1, "r_x3": 426.7, "r_y3": 161.1, "coord_origin": "TOPLEFT" }, "text": "Inference", "orig": "Inference", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 12, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 423.1, "r_y0": 180.1, "r_x1": 466.7, "r_y1": 180.1, "r_x2": 466.7, "r_y2": 172.0, "r_x3": 423.1, "r_y3": 172.0, "coord_origin": "TOPLEFT" }, "text": "time (secs)", "orig": "time (secs)", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 13, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 262.4, "r_y0": 182.1, "r_x1": 288.1, "r_y1": 182.1, "r_x2": 288.1, "r_y2": 174.0, "r_x3": 262.4, "r_y3": 174.0, "coord_origin": "TOPLEFT" }, "text": "simple", "orig": "simple", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 14, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 296.4, "r_y0": 182.1, "r_x1": 329.4, "r_y1": 182.1, "r_x2": 329.4, "r_y2": 174.0, "r_x3": 296.4, "r_y3": 174.0, "coord_origin": "TOPLEFT" }, "text": "complex", "orig": "complex", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 15, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 345.0, "r_y0": 182.1, "r_x1": 354.8, "r_y1": 182.1, "r_x2": 354.8, "r_y2": 174.0, "r_x3": 345.0, "r_y3": 174.0, "coord_origin": "TOPLEFT" }, "text": "all", "orig": "all", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 16, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 154.5, "r_y0": 200.9, "r_x1": 201.2, "r_y1": 200.9, "r_x2": 201.2, "r_y2": 192.9, "r_x3": 154.5, "r_y3": 192.9, "coord_origin": "TOPLEFT" }, "text": "PubTabNet", "orig": "PubTabNet", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 17, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 222.4, "r_y0": 195.5, "r_x1": 247.1, "r_y1": 195.5, "r_x2": 247.1, "r_y2": 187.4, "r_x3": 222.4, "r_y3": 187.4, "coord_origin": "TOPLEFT" }, "text": "OTSL", "orig": "OTSL", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 18, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 264.7, "r_y0": 195.5, "r_x1": 285.7, "r_y1": 195.5, "r_x2": 285.7, "r_y2": 187.4, "r_x3": 264.7, "r_y3": 187.4, "coord_origin": "TOPLEFT" }, "text": "0.965", "orig": "0.965", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 19, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 302.4, "r_y0": 195.5, "r_x1": 323.4, "r_y1": 195.5, "r_x2": 323.4, "r_y2": 187.4, "r_x3": 302.4, "r_y3": 187.4, "coord_origin": "TOPLEFT" }, "text": "0.934", "orig": "0.934", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 20, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 339.4, "r_y0": 195.5, "r_x1": 360.4, "r_y1": 195.5, "r_x2": 360.4, "r_y2": 187.4, "r_x3": 339.4, "r_y3": 187.4, "coord_origin": "TOPLEFT" }, "text": "0.955", "orig": "0.955", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 21, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 383.1, "r_y0": 195.2, "r_x1": 402.0, "r_y1": 195.2, "r_x2": 402.0, "r_y2": 187.3, "r_x3": 383.1, "r_y3": 187.3, "coord_origin": "TOPLEFT" }, "text": "0.88", "orig": "0.88", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 22, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 435.5, "r_y0": 195.2, "r_x1": 454.4, "r_y1": 195.2, "r_x2": 454.4, "r_y2": 187.3, "r_x3": 435.5, "r_y3": 187.3, "coord_origin": "TOPLEFT" }, "text": "2.73", "orig": "2.73", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 23, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 220.9, "r_y0": 208.4, "r_x1": 248.7, "r_y1": 208.4, "r_x2": 248.7, "r_y2": 200.3, "r_x3": 220.9, "r_y3": 200.3, "coord_origin": "TOPLEFT" }, "text": "HTML", "orig": "HTML", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 24, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 264.7, "r_y0": 208.4, "r_x1": 285.7, "r_y1": 208.4, "r_x2": 285.7, "r_y2": 200.3, "r_x3": 264.7, "r_y3": 200.3, "coord_origin": "TOPLEFT" }, "text": "0.969", "orig": "0.969", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 25, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 302.4, "r_y0": 208.4, "r_x1": 323.4, "r_y1": 208.4, "r_x2": 323.4, "r_y2": 200.3, "r_x3": 302.4, "r_y3": 200.3, "coord_origin": "TOPLEFT" }, "text": "0.927", "orig": "0.927", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 26, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 339.4, "r_y0": 208.4, "r_x1": 360.4, "r_y1": 208.4, "r_x2": 360.4, "r_y2": 200.3, "r_x3": 339.4, "r_y3": 200.3, "coord_origin": "TOPLEFT" }, "text": "0.955", "orig": "0.955", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 27, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 382.1, "r_y0": 208.4, "r_x1": 403.0, "r_y1": 208.4, "r_x2": 403.0, "r_y2": 200.3, "r_x3": 382.1, "r_y3": 200.3, "coord_origin": "TOPLEFT" }, "text": "0.857", "orig": "0.857", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 28, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 436.7, "r_y0": 208.4, "r_x1": 453.1, "r_y1": 208.4, "r_x2": 453.1, "r_y2": 200.3, "r_x3": 436.7, "r_y3": 200.3, "coord_origin": "TOPLEFT" }, "text": "5.39", "orig": "5.39", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 29, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 155.9, "r_y0": 227.2, "r_x1": 199.8, "r_y1": 227.2, "r_x2": 199.8, "r_y2": 219.2, "r_x3": 155.9, "r_y3": 219.2, "coord_origin": "TOPLEFT" }, "text": "FinTabNet", "orig": "FinTabNet", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 30, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 222.4, "r_y0": 221.8, "r_x1": 247.1, "r_y1": 221.8, "r_x2": 247.1, "r_y2": 213.7, "r_x3": 222.4, "r_y3": 213.7, "coord_origin": "TOPLEFT" }, "text": "OTSL", "orig": "OTSL", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 31, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 264.7, "r_y0": 221.8, "r_x1": 285.7, "r_y1": 221.8, "r_x2": 285.7, "r_y2": 213.7, "r_x3": 264.7, "r_y3": 213.7, "coord_origin": "TOPLEFT" }, "text": "0.955", "orig": "0.955", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 32, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 302.4, "r_y0": 221.8, "r_x1": 323.4, "r_y1": 221.8, "r_x2": 323.4, "r_y2": 213.7, "r_x3": 302.4, "r_y3": 213.7, "coord_origin": "TOPLEFT" }, "text": "0.961", "orig": "0.961", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 33, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 337.8, "r_y0": 221.5, "r_x1": 362.0, "r_y1": 221.5, "r_x2": 362.0, "r_y2": 213.6, "r_x3": 337.8, "r_y3": 213.6, "coord_origin": "TOPLEFT" }, "text": "0.959", "orig": "0.959", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 34, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 380.5, "r_y0": 221.5, "r_x1": 404.6, "r_y1": 221.5, "r_x2": 404.6, "r_y2": 213.6, "r_x3": 380.5, "r_y3": 213.6, "coord_origin": "TOPLEFT" }, "text": "0.862", "orig": "0.862", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 35, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 435.5, "r_y0": 221.5, "r_x1": 454.4, "r_y1": 221.5, "r_x2": 454.4, "r_y2": 213.6, "r_x3": 435.5, "r_y3": 213.6, "coord_origin": "TOPLEFT" }, "text": "1.85", "orig": "1.85", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 36, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 220.9, "r_y0": 234.7, "r_x1": 248.7, "r_y1": 234.7, "r_x2": 248.7, "r_y2": 226.6, "r_x3": 220.9, "r_y3": 226.6, "coord_origin": "TOPLEFT" }, "text": "HTML", "orig": "HTML", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 37, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 264.7, "r_y0": 234.7, "r_x1": 285.7, "r_y1": 234.7, "r_x2": 285.7, "r_y2": 226.6, "r_x3": 264.7, "r_y3": 226.6, "coord_origin": "TOPLEFT" }, "text": "0.917", "orig": "0.917", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 38, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 302.4, "r_y0": 234.7, "r_x1": 323.4, "r_y1": 234.7, "r_x2": 323.4, "r_y2": 226.6, "r_x3": 302.4, "r_y3": 226.6, "coord_origin": "TOPLEFT" }, "text": "0.922", "orig": "0.922", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 39, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 341.7, "r_y0": 234.7, "r_x1": 358.1, "r_y1": 234.7, "r_x2": 358.1, "r_y2": 226.6, "r_x3": 341.7, "r_y3": 226.6, "coord_origin": "TOPLEFT" }, "text": "0.92", "orig": "0.92", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 40, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 382.1, "r_y0": 234.7, "r_x1": 403.0, "r_y1": 234.7, "r_x2": 403.0, "r_y2": 226.6, "r_x3": 382.1, "r_y3": 226.6, "coord_origin": "TOPLEFT" }, "text": "0.722", "orig": "0.722", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 41, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 436.7, "r_y0": 234.7, "r_x1": 453.1, "r_y1": 234.7, "r_x2": 453.1, "r_y2": 226.6, "r_x3": 436.7, "r_y3": 226.6, "coord_origin": "TOPLEFT" }, "text": "3.26", "orig": "3.26", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 42, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 148.6, "r_y0": 253.5, "r_x1": 207.2, "r_y1": 253.5, "r_x2": 207.2, "r_y2": 245.5, "r_x3": 148.6, "r_y3": 245.5, "coord_origin": "TOPLEFT" }, "text": "PubTables-1M", "orig": "PubTables-1M", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 43, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 222.4, "r_y0": 248.1, "r_x1": 247.1, "r_y1": 248.1, "r_x2": 247.1, "r_y2": 240.0, "r_x3": 222.4, "r_y3": 240.0, "coord_origin": "TOPLEFT" }, "text": "OTSL", "orig": "OTSL", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 44, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 264.7, "r_y0": 248.1, "r_x1": 285.7, "r_y1": 248.1, "r_x2": 285.7, "r_y2": 240.0, "r_x3": 264.7, "r_y3": 240.0, "coord_origin": "TOPLEFT" }, "text": "0.987", "orig": "0.987", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 45, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 302.4, "r_y0": 248.1, "r_x1": 323.4, "r_y1": 248.1, "r_x2": 323.4, "r_y2": 240.0, "r_x3": 302.4, "r_y3": 240.0, "coord_origin": "TOPLEFT" }, "text": "0.964", "orig": "0.964", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 46, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 337.8, "r_y0": 247.8, "r_x1": 362.0, "r_y1": 247.8, "r_x2": 362.0, "r_y2": 239.9, "r_x3": 337.8, "r_y3": 239.9, "coord_origin": "TOPLEFT" }, "text": "0.977", "orig": "0.977", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 47, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 380.5, "r_y0": 247.8, "r_x1": 404.6, "r_y1": 247.8, "r_x2": 404.6, "r_y2": 239.9, "r_x3": 380.5, "r_y3": 239.9, "coord_origin": "TOPLEFT" }, "text": "0.896", "orig": "0.896", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 48, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 435.5, "r_y0": 247.8, "r_x1": 454.4, "r_y1": 247.8, "r_x2": 454.4, "r_y2": 239.9, "r_x3": 435.5, "r_y3": 239.9, "coord_origin": "TOPLEFT" }, "text": "1.79", "orig": "1.79", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 49, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 220.9, "r_y0": 261.0, "r_x1": 248.7, "r_y1": 261.0, "r_x2": 248.7, "r_y2": 252.9, "r_x3": 220.9, "r_y3": 252.9, "coord_origin": "TOPLEFT" }, "text": "HTML", "orig": "HTML", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 50, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 264.7, "r_y0": 261.0, "r_x1": 285.7, "r_y1": 261.0, "r_x2": 285.7, "r_y2": 252.9, "r_x3": 264.7, "r_y3": 252.9, "coord_origin": "TOPLEFT" }, "text": "0.983", "orig": "0.983", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 51, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 302.4, "r_y0": 261.0, "r_x1": 323.4, "r_y1": 261.0, "r_x2": 323.4, "r_y2": 252.9, "r_x3": 302.4, "r_y3": 252.9, "coord_origin": "TOPLEFT" }, "text": "0.944", "orig": "0.944", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 52, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 339.4, "r_y0": 261.0, "r_x1": 360.4, "r_y1": 261.0, "r_x2": 360.4, "r_y2": 252.9, "r_x3": 339.4, "r_y3": 252.9, "coord_origin": "TOPLEFT" }, "text": "0.966", "orig": "0.966", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 53, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 382.1, "r_y0": 261.0, "r_x1": 403.0, "r_y1": 261.0, "r_x2": 403.0, "r_y2": 252.9, "r_x3": 382.1, "r_y3": 252.9, "coord_origin": "TOPLEFT" }, "text": "0.889", "orig": "0.889", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 54, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 436.7, "r_y0": 261.0, "r_x1": 453.1, "r_y1": 261.0, "r_x2": 453.1, "r_y2": 252.9, "r_x3": 436.7, "r_y3": 252.9, "coord_origin": "TOPLEFT" }, "text": "3.26", "orig": "3.26", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [ { "id": 10, "label": "text", "bbox": { "l": 160.8, "t": 166.6, "r": 195.0, "b": 174.6, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 7, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 160.8, "r_y0": 174.6, "r_x1": 195.0, "r_y1": 174.6, "r_x2": 195.0, "r_y2": 166.6, "r_x3": 160.8, "r_y3": 166.6, "coord_origin": "TOPLEFT" }, "text": "Data set", "orig": "Data set", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 11, "label": "text", "bbox": { "l": 215.5, "t": 166.5, "r": 254.0, "b": 174.6, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 8, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 215.5, "r_y0": 174.6, "r_x1": 254.0, "r_y1": 174.6, "r_x2": 254.0, "r_y2": 166.5, "r_x3": 215.5, "r_y3": 166.5, "coord_origin": "TOPLEFT" }, "text": "Language", "orig": "Language", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 12, "label": "text", "bbox": { "l": 300.4, "t": 161.1, "r": 324.0, "b": 169.1, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 9, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 300.4, "r_y0": 169.1, "r_x1": 324.0, "r_y1": 169.1, "r_x2": 324.0, "r_y2": 161.1, "r_x3": 300.4, "r_y3": 161.1, "coord_origin": "TOPLEFT" }, "text": "TEDs", "orig": "TEDs", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 13, "label": "text", "bbox": { "l": 370.3, "t": 166.6, "r": 414.7, "b": 174.6, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 10, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 370.3, "r_y0": 174.6, "r_x1": 414.7, "r_y1": 174.6, "r_x2": 414.7, "r_y2": 166.6, "r_x3": 370.3, "r_y3": 166.6, "coord_origin": "TOPLEFT" }, "text": "mAP(0.75)", "orig": "mAP(0.75)", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 14, "label": "text", "bbox": { "l": 426.7, "t": 161.1, "r": 463.1, "b": 169.1, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 11, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 426.7, "r_y0": 169.1, "r_x1": 463.1, "r_y1": 169.1, "r_x2": 463.1, "r_y2": 161.1, "r_x3": 426.7, "r_y3": 161.1, "coord_origin": "TOPLEFT" }, "text": "Inference", "orig": "Inference", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 15, "label": "text", "bbox": { "l": 423.1, "t": 172.0, "r": 466.7, "b": 180.1, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 12, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 423.1, "r_y0": 180.1, "r_x1": 466.7, "r_y1": 180.1, "r_x2": 466.7, "r_y2": 172.0, "r_x3": 423.1, "r_y3": 172.0, "coord_origin": "TOPLEFT" }, "text": "time (secs)", "orig": "time (secs)", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 16, "label": "text", "bbox": { "l": 262.4, "t": 174.0, "r": 288.1, "b": 182.1, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 13, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 262.4, "r_y0": 182.1, "r_x1": 288.1, "r_y1": 182.1, "r_x2": 288.1, "r_y2": 174.0, "r_x3": 262.4, "r_y3": 174.0, "coord_origin": "TOPLEFT" }, "text": "simple", "orig": "simple", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 17, "label": "text", "bbox": { "l": 296.4, "t": 174.0, "r": 329.4, "b": 182.1, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 14, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 296.4, "r_y0": 182.1, "r_x1": 329.4, "r_y1": 182.1, "r_x2": 329.4, "r_y2": 174.0, "r_x3": 296.4, "r_y3": 174.0, "coord_origin": "TOPLEFT" }, "text": "complex", "orig": "complex", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 18, "label": "text", "bbox": { "l": 345.0, "t": 174.0, "r": 354.8, "b": 182.1, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 15, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 345.0, "r_y0": 182.1, "r_x1": 354.8, "r_y1": 182.1, "r_x2": 354.8, "r_y2": 174.0, "r_x3": 345.0, "r_y3": 174.0, "coord_origin": "TOPLEFT" }, "text": "all", "orig": "all", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 19, "label": "text", "bbox": { "l": 154.5, "t": 192.9, "r": 201.2, "b": 200.9, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 16, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 154.5, "r_y0": 200.9, "r_x1": 201.2, "r_y1": 200.9, "r_x2": 201.2, "r_y2": 192.9, "r_x3": 154.5, "r_y3": 192.9, "coord_origin": "TOPLEFT" }, "text": "PubTabNet", "orig": "PubTabNet", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 20, "label": "text", "bbox": { "l": 222.4, "t": 187.4, "r": 247.1, "b": 195.5, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 17, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 222.4, "r_y0": 195.5, "r_x1": 247.1, "r_y1": 195.5, "r_x2": 247.1, "r_y2": 187.4, "r_x3": 222.4, "r_y3": 187.4, "coord_origin": "TOPLEFT" }, "text": "OTSL", "orig": "OTSL", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 21, "label": "text", "bbox": { "l": 264.7, "t": 187.4, "r": 285.7, "b": 195.5, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 18, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 264.7, "r_y0": 195.5, "r_x1": 285.7, "r_y1": 195.5, "r_x2": 285.7, "r_y2": 187.4, "r_x3": 264.7, "r_y3": 187.4, "coord_origin": "TOPLEFT" }, "text": "0.965", "orig": "0.965", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 22, "label": "text", "bbox": { "l": 302.4, "t": 187.4, "r": 323.4, "b": 195.5, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 19, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 302.4, "r_y0": 195.5, "r_x1": 323.4, "r_y1": 195.5, "r_x2": 323.4, "r_y2": 187.4, "r_x3": 302.4, "r_y3": 187.4, "coord_origin": "TOPLEFT" }, "text": "0.934", "orig": "0.934", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 23, "label": "text", "bbox": { "l": 339.4, "t": 187.4, "r": 360.4, "b": 195.5, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 20, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 339.4, "r_y0": 195.5, "r_x1": 360.4, "r_y1": 195.5, "r_x2": 360.4, "r_y2": 187.4, "r_x3": 339.4, "r_y3": 187.4, "coord_origin": "TOPLEFT" }, "text": "0.955", "orig": "0.955", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 24, "label": "text", "bbox": { "l": 383.1, "t": 187.3, "r": 402.0, "b": 195.2, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 21, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 383.1, "r_y0": 195.2, "r_x1": 402.0, "r_y1": 195.2, "r_x2": 402.0, "r_y2": 187.3, "r_x3": 383.1, "r_y3": 187.3, "coord_origin": "TOPLEFT" }, "text": "0.88", "orig": "0.88", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 25, "label": "text", "bbox": { "l": 435.5, "t": 187.3, "r": 454.4, "b": 195.2, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 22, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 435.5, "r_y0": 195.2, "r_x1": 454.4, "r_y1": 195.2, "r_x2": 454.4, "r_y2": 187.3, "r_x3": 435.5, "r_y3": 187.3, "coord_origin": "TOPLEFT" }, "text": "2.73", "orig": "2.73", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 26, "label": "text", "bbox": { "l": 220.9, "t": 200.3, "r": 248.7, "b": 208.4, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 23, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 220.9, "r_y0": 208.4, "r_x1": 248.7, "r_y1": 208.4, "r_x2": 248.7, "r_y2": 200.3, "r_x3": 220.9, "r_y3": 200.3, "coord_origin": "TOPLEFT" }, "text": "HTML", "orig": "HTML", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 27, "label": "text", "bbox": { "l": 264.7, "t": 200.3, "r": 285.7, "b": 208.4, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 24, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 264.7, "r_y0": 208.4, "r_x1": 285.7, "r_y1": 208.4, "r_x2": 285.7, "r_y2": 200.3, "r_x3": 264.7, "r_y3": 200.3, "coord_origin": "TOPLEFT" }, "text": "0.969", "orig": "0.969", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 28, "label": "text", "bbox": { "l": 302.4, "t": 200.3, "r": 323.4, "b": 208.4, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 25, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 302.4, "r_y0": 208.4, "r_x1": 323.4, "r_y1": 208.4, "r_x2": 323.4, "r_y2": 200.3, "r_x3": 302.4, "r_y3": 200.3, "coord_origin": "TOPLEFT" }, "text": "0.927", "orig": "0.927", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 29, "label": "text", "bbox": { "l": 339.4, "t": 200.3, "r": 360.4, "b": 208.4, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 26, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 339.4, "r_y0": 208.4, "r_x1": 360.4, "r_y1": 208.4, "r_x2": 360.4, "r_y2": 200.3, "r_x3": 339.4, "r_y3": 200.3, "coord_origin": "TOPLEFT" }, "text": "0.955", "orig": "0.955", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 30, "label": "text", "bbox": { "l": 382.1, "t": 200.3, "r": 403.0, "b": 208.4, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 27, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 382.1, "r_y0": 208.4, "r_x1": 403.0, "r_y1": 208.4, "r_x2": 403.0, "r_y2": 200.3, "r_x3": 382.1, "r_y3": 200.3, "coord_origin": "TOPLEFT" }, "text": "0.857", "orig": "0.857", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 31, "label": "text", "bbox": { "l": 436.7, "t": 200.3, "r": 453.1, "b": 208.4, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 28, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 436.7, "r_y0": 208.4, "r_x1": 453.1, "r_y1": 208.4, "r_x2": 453.1, "r_y2": 200.3, "r_x3": 436.7, "r_y3": 200.3, "coord_origin": "TOPLEFT" }, "text": "5.39", "orig": "5.39", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 32, "label": "text", "bbox": { "l": 155.9, "t": 219.2, "r": 199.8, "b": 227.2, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 29, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 155.9, "r_y0": 227.2, "r_x1": 199.8, "r_y1": 227.2, "r_x2": 199.8, "r_y2": 219.2, "r_x3": 155.9, "r_y3": 219.2, "coord_origin": "TOPLEFT" }, "text": "FinTabNet", "orig": "FinTabNet", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 33, "label": "text", "bbox": { "l": 222.4, "t": 213.7, "r": 247.1, "b": 221.8, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 30, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 222.4, "r_y0": 221.8, "r_x1": 247.1, "r_y1": 221.8, "r_x2": 247.1, "r_y2": 213.7, "r_x3": 222.4, "r_y3": 213.7, "coord_origin": "TOPLEFT" }, "text": "OTSL", "orig": "OTSL", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 34, "label": "text", "bbox": { "l": 264.7, "t": 213.7, "r": 285.7, "b": 221.8, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 31, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 264.7, "r_y0": 221.8, "r_x1": 285.7, "r_y1": 221.8, "r_x2": 285.7, "r_y2": 213.7, "r_x3": 264.7, "r_y3": 213.7, "coord_origin": "TOPLEFT" }, "text": "0.955", "orig": "0.955", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 35, "label": "text", "bbox": { "l": 302.4, "t": 213.7, "r": 323.4, "b": 221.8, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 32, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 302.4, "r_y0": 221.8, "r_x1": 323.4, "r_y1": 221.8, "r_x2": 323.4, "r_y2": 213.7, "r_x3": 302.4, "r_y3": 213.7, "coord_origin": "TOPLEFT" }, "text": "0.961", "orig": "0.961", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 36, "label": "text", "bbox": { "l": 337.8, "t": 213.6, "r": 362.0, "b": 221.5, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 33, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 337.8, "r_y0": 221.5, "r_x1": 362.0, "r_y1": 221.5, "r_x2": 362.0, "r_y2": 213.6, "r_x3": 337.8, "r_y3": 213.6, "coord_origin": "TOPLEFT" }, "text": "0.959", "orig": "0.959", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 37, "label": "text", "bbox": { "l": 380.5, "t": 213.6, "r": 404.6, "b": 221.5, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 34, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 380.5, "r_y0": 221.5, "r_x1": 404.6, "r_y1": 221.5, "r_x2": 404.6, "r_y2": 213.6, "r_x3": 380.5, "r_y3": 213.6, "coord_origin": "TOPLEFT" }, "text": "0.862", "orig": "0.862", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 38, "label": "text", "bbox": { "l": 435.5, "t": 213.6, "r": 454.4, "b": 221.5, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 35, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 435.5, "r_y0": 221.5, "r_x1": 454.4, "r_y1": 221.5, "r_x2": 454.4, "r_y2": 213.6, "r_x3": 435.5, "r_y3": 213.6, "coord_origin": "TOPLEFT" }, "text": "1.85", "orig": "1.85", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 39, "label": "text", "bbox": { "l": 220.9, "t": 226.6, "r": 248.7, "b": 234.7, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 36, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 220.9, "r_y0": 234.7, "r_x1": 248.7, "r_y1": 234.7, "r_x2": 248.7, "r_y2": 226.6, "r_x3": 220.9, "r_y3": 226.6, "coord_origin": "TOPLEFT" }, "text": "HTML", "orig": "HTML", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 40, "label": "text", "bbox": { "l": 264.7, "t": 226.6, "r": 285.7, "b": 234.7, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 37, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 264.7, "r_y0": 234.7, "r_x1": 285.7, "r_y1": 234.7, "r_x2": 285.7, "r_y2": 226.6, "r_x3": 264.7, "r_y3": 226.6, "coord_origin": "TOPLEFT" }, "text": "0.917", "orig": "0.917", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 41, "label": "text", "bbox": { "l": 302.4, "t": 226.6, "r": 323.4, "b": 234.7, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 38, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 302.4, "r_y0": 234.7, "r_x1": 323.4, "r_y1": 234.7, "r_x2": 323.4, "r_y2": 226.6, "r_x3": 302.4, "r_y3": 226.6, "coord_origin": "TOPLEFT" }, "text": "0.922", "orig": "0.922", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 42, "label": "text", "bbox": { "l": 341.7, "t": 226.6, "r": 358.1, "b": 234.7, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 39, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 341.7, "r_y0": 234.7, "r_x1": 358.1, "r_y1": 234.7, "r_x2": 358.1, "r_y2": 226.6, "r_x3": 341.7, "r_y3": 226.6, "coord_origin": "TOPLEFT" }, "text": "0.92", "orig": "0.92", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 43, "label": "text", "bbox": { "l": 382.1, "t": 226.6, "r": 403.0, "b": 234.7, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 40, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 382.1, "r_y0": 234.7, "r_x1": 403.0, "r_y1": 234.7, "r_x2": 403.0, "r_y2": 226.6, "r_x3": 382.1, "r_y3": 226.6, "coord_origin": "TOPLEFT" }, "text": "0.722", "orig": "0.722", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 44, "label": "text", "bbox": { "l": 436.7, "t": 226.6, "r": 453.1, "b": 234.7, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 41, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 436.7, "r_y0": 234.7, "r_x1": 453.1, "r_y1": 234.7, "r_x2": 453.1, "r_y2": 226.6, "r_x3": 436.7, "r_y3": 226.6, "coord_origin": "TOPLEFT" }, "text": "3.26", "orig": "3.26", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 45, "label": "text", "bbox": { "l": 148.6, "t": 245.5, "r": 207.2, "b": 253.5, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 42, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 148.6, "r_y0": 253.5, "r_x1": 207.2, "r_y1": 253.5, "r_x2": 207.2, "r_y2": 245.5, "r_x3": 148.6, "r_y3": 245.5, "coord_origin": "TOPLEFT" }, "text": "PubTables-1M", "orig": "PubTables-1M", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 46, "label": "text", "bbox": { "l": 222.4, "t": 240.0, "r": 247.1, "b": 248.1, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 43, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 222.4, "r_y0": 248.1, "r_x1": 247.1, "r_y1": 248.1, "r_x2": 247.1, "r_y2": 240.0, "r_x3": 222.4, "r_y3": 240.0, "coord_origin": "TOPLEFT" }, "text": "OTSL", "orig": "OTSL", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 47, "label": "text", "bbox": { "l": 264.7, "t": 240.0, "r": 285.7, "b": 248.1, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 44, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 264.7, "r_y0": 248.1, "r_x1": 285.7, "r_y1": 248.1, "r_x2": 285.7, "r_y2": 240.0, "r_x3": 264.7, "r_y3": 240.0, "coord_origin": "TOPLEFT" }, "text": "0.987", "orig": "0.987", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 48, "label": "text", "bbox": { "l": 302.4, "t": 240.0, "r": 323.4, "b": 248.1, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 45, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 302.4, "r_y0": 248.1, "r_x1": 323.4, "r_y1": 248.1, "r_x2": 323.4, "r_y2": 240.0, "r_x3": 302.4, "r_y3": 240.0, "coord_origin": "TOPLEFT" }, "text": "0.964", "orig": "0.964", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 49, "label": "text", "bbox": { "l": 337.8, "t": 239.9, "r": 362.0, "b": 247.8, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 46, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 337.8, "r_y0": 247.8, "r_x1": 362.0, "r_y1": 247.8, "r_x2": 362.0, "r_y2": 239.9, "r_x3": 337.8, "r_y3": 239.9, "coord_origin": "TOPLEFT" }, "text": "0.977", "orig": "0.977", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 50, "label": "text", "bbox": { "l": 380.5, "t": 239.9, "r": 404.6, "b": 247.8, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 47, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 380.5, "r_y0": 247.8, "r_x1": 404.6, "r_y1": 247.8, "r_x2": 404.6, "r_y2": 239.9, "r_x3": 380.5, "r_y3": 239.9, "coord_origin": "TOPLEFT" }, "text": "0.896", "orig": "0.896", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 51, "label": "text", "bbox": { "l": 435.5, "t": 239.9, "r": 454.4, "b": 247.8, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 48, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 435.5, "r_y0": 247.8, "r_x1": 454.4, "r_y1": 247.8, "r_x2": 454.4, "r_y2": 239.9, "r_x3": 435.5, "r_y3": 239.9, "coord_origin": "TOPLEFT" }, "text": "1.79", "orig": "1.79", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 52, "label": "text", "bbox": { "l": 220.9, "t": 252.9, "r": 248.7, "b": 261.0, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 49, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 220.9, "r_y0": 261.0, "r_x1": 248.7, "r_y1": 261.0, "r_x2": 248.7, "r_y2": 252.9, "r_x3": 220.9, "r_y3": 252.9, "coord_origin": "TOPLEFT" }, "text": "HTML", "orig": "HTML", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 53, "label": "text", "bbox": { "l": 264.7, "t": 252.9, "r": 285.7, "b": 261.0, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 50, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 264.7, "r_y0": 261.0, "r_x1": 285.7, "r_y1": 261.0, "r_x2": 285.7, "r_y2": 252.9, "r_x3": 264.7, "r_y3": 252.9, "coord_origin": "TOPLEFT" }, "text": "0.983", "orig": "0.983", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 54, "label": "text", "bbox": { "l": 302.4, "t": 252.9, "r": 323.4, "b": 261.0, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 51, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 302.4, "r_y0": 261.0, "r_x1": 323.4, "r_y1": 261.0, "r_x2": 323.4, "r_y2": 252.9, "r_x3": 302.4, "r_y3": 252.9, "coord_origin": "TOPLEFT" }, "text": "0.944", "orig": "0.944", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 55, "label": "text", "bbox": { "l": 339.4, "t": 252.9, "r": 360.4, "b": 261.0, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 52, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 339.4, "r_y0": 261.0, "r_x1": 360.4, "r_y1": 261.0, "r_x2": 360.4, "r_y2": 252.9, "r_x3": 339.4, "r_y3": 252.9, "coord_origin": "TOPLEFT" }, "text": "0.966", "orig": "0.966", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 56, "label": "text", "bbox": { "l": 382.1, "t": 252.9, "r": 403.0, "b": 261.0, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 53, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 382.1, "r_y0": 261.0, "r_x1": 403.0, "r_y1": 261.0, "r_x2": 403.0, "r_y2": 252.9, "r_x3": 382.1, "r_y3": 252.9, "coord_origin": "TOPLEFT" }, "text": "0.889", "orig": "0.889", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 57, "label": "text", "bbox": { "l": 436.7, "t": 252.9, "r": 453.1, "b": 261.0, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 54, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 436.7, "r_y0": 261.0, "r_x1": 453.1, "r_y1": 261.0, "r_x2": 453.1, "r_y2": 252.9, "r_x3": 436.7, "r_y3": 252.9, "coord_origin": "TOPLEFT" }, "text": "3.26", "orig": "3.26", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] } ] }, "text": null, "otsl_seq": [ "ched", "ched", "ched", "lcel", "lcel", "ched", "ched", "nl", "ucel", "ucel", "ched", "ched", "ched", "ucel", "ucel", "nl", "fcel", "fcel", "fcel", "fcel", "fcel", "fcel", "fcel", "nl", "fcel", "fcel", "fcel", "fcel", "fcel", "fcel", "fcel", "nl", "fcel", "fcel", "fcel", "fcel", "fcel", "fcel", "fcel", "nl" ], "num_rows": 5, "num_cols": 7, "table_cells": [ { "bbox": { "l": 160.8, "t": 166.6, "r": 195.0, "b": 174.6, "coord_origin": "TOPLEFT" }, "row_span": 2, "col_span": 1, "start_row_offset_idx": 0, "end_row_offset_idx": 2, "start_col_offset_idx": 0, "end_col_offset_idx": 1, "text": "Data set", "column_header": true, "row_header": false, "row_section": false }, { "bbox": { "l": 215.5, "t": 166.5, "r": 254.0, "b": 174.6, "coord_origin": "TOPLEFT" }, "row_span": 2, "col_span": 1, "start_row_offset_idx": 0, "end_row_offset_idx": 2, "start_col_offset_idx": 1, "end_col_offset_idx": 2, "text": "Language", "column_header": true, "row_header": false, "row_section": false }, { "bbox": { "l": 300.4, "t": 161.1, "r": 324.0, "b": 169.1, "coord_origin": "TOPLEFT" }, "row_span": 1, "col_span": 3, "start_row_offset_idx": 0, "end_row_offset_idx": 1, "start_col_offset_idx": 2, "end_col_offset_idx": 5, "text": "TEDs", "column_header": true, "row_header": false, "row_section": false }, { "bbox": { "l": 370.3, "t": 166.6, "r": 414.7, "b": 174.6, "coord_origin": "TOPLEFT" }, "row_span": 2, "col_span": 1, "start_row_offset_idx": 0, "end_row_offset_idx": 2, "start_col_offset_idx": 5, "end_col_offset_idx": 6, "text": "mAP(0.75)", "column_header": true, "row_header": false, "row_section": false }, { "bbox": { "l": 426.7, "t": 161.1, "r": 463.1, "b": 169.1, "coord_origin": "TOPLEFT" }, "row_span": 2, "col_span": 1, "start_row_offset_idx": 0, "end_row_offset_idx": 2, "start_col_offset_idx": 6, "end_col_offset_idx": 7, "text": "Inference time (secs)", "column_header": true, "row_header": false, "row_section": false }, { "bbox": { "l": 262.4, "t": 174.0, "r": 288.1, "b": 182.1, "coord_origin": "TOPLEFT" }, "row_span": 1, "col_span": 1, "start_row_offset_idx": 1, "end_row_offset_idx": 2, "start_col_offset_idx": 2, "end_col_offset_idx": 3, "text": "simple", "column_header": true, "row_header": false, "row_section": false }, { "bbox": { "l": 296.4, "t": 174.0, "r": 329.4, "b": 182.1, "coord_origin": "TOPLEFT" }, "row_span": 1, "col_span": 1, "start_row_offset_idx": 1, "end_row_offset_idx": 2, "start_col_offset_idx": 3, "end_col_offset_idx": 4, "text": "complex", "column_header": true, "row_header": false, "row_section": false }, { "bbox": { "l": 345.0, "t": 174.0, "r": 354.8, "b": 182.1, "coord_origin": "TOPLEFT" }, "row_span": 1, "col_span": 1, "start_row_offset_idx": 1, "end_row_offset_idx": 2, "start_col_offset_idx": 4, "end_col_offset_idx": 5, "text": "all", "column_header": true, "row_header": false, "row_section": false }, { "bbox": { "l": 154.5, "t": 192.9, "r": 201.2, "b": 200.9, "coord_origin": "TOPLEFT" }, "row_span": 1, "col_span": 1, "start_row_offset_idx": 2, "end_row_offset_idx": 3, "start_col_offset_idx": 0, "end_col_offset_idx": 1, "text": "PubTabNet", "column_header": false, "row_header": false, "row_section": false }, { "bbox": { "l": 222.4, "t": 187.4, "r": 247.1, "b": 195.5, "coord_origin": "TOPLEFT" }, "row_span": 1, "col_span": 1, "start_row_offset_idx": 2, "end_row_offset_idx": 3, "start_col_offset_idx": 1, "end_col_offset_idx": 2, "text": "OTSL HTML", "column_header": false, "row_header": false, "row_section": false }, { "bbox": { "l": 264.7, "t": 187.4, "r": 285.7, "b": 195.5, "coord_origin": "TOPLEFT" }, "row_span": 1, "col_span": 1, "start_row_offset_idx": 2, "end_row_offset_idx": 3, "start_col_offset_idx": 2, "end_col_offset_idx": 3, "text": "0.965 0.969", "column_header": false, "row_header": false, "row_section": false }, { "bbox": { "l": 302.4, "t": 187.4, "r": 323.4, "b": 195.5, "coord_origin": "TOPLEFT" }, "row_span": 1, "col_span": 1, "start_row_offset_idx": 2, "end_row_offset_idx": 3, "start_col_offset_idx": 3, "end_col_offset_idx": 4, "text": "0.934 0.927", "column_header": false, "row_header": false, "row_section": false }, { "bbox": { "l": 339.4, "t": 187.4, "r": 360.4, "b": 195.5, "coord_origin": "TOPLEFT" }, "row_span": 1, "col_span": 1, "start_row_offset_idx": 2, "end_row_offset_idx": 3, "start_col_offset_idx": 4, "end_col_offset_idx": 5, "text": "0.955 0.955", "column_header": false, "row_header": false, "row_section": false }, { "bbox": { "l": 383.1, "t": 187.3, "r": 402.0, "b": 195.2, "coord_origin": "TOPLEFT" }, "row_span": 1, "col_span": 1, "start_row_offset_idx": 2, "end_row_offset_idx": 3, "start_col_offset_idx": 5, "end_col_offset_idx": 6, "text": "0.88 0.857", "column_header": false, "row_header": false, "row_section": false }, { "bbox": { "l": 435.5, "t": 187.3, "r": 454.4, "b": 195.2, "coord_origin": "TOPLEFT" }, "row_span": 1, "col_span": 1, "start_row_offset_idx": 2, "end_row_offset_idx": 3, "start_col_offset_idx": 6, "end_col_offset_idx": 7, "text": "2.73 5.39", "column_header": false, "row_header": false, "row_section": false }, { "bbox": { "l": 155.9, "t": 219.2, "r": 199.8, "b": 227.2, "coord_origin": "TOPLEFT" }, "row_span": 1, "col_span": 1, "start_row_offset_idx": 3, "end_row_offset_idx": 4, "start_col_offset_idx": 0, "end_col_offset_idx": 1, "text": "FinTabNet", "column_header": false, "row_header": false, "row_section": false }, { "bbox": { "l": 222.4, "t": 213.7, "r": 247.1, "b": 221.8, "coord_origin": "TOPLEFT" }, "row_span": 1, "col_span": 1, "start_row_offset_idx": 3, "end_row_offset_idx": 4, "start_col_offset_idx": 1, "end_col_offset_idx": 2, "text": "OTSL HTML", "column_header": false, "row_header": false, "row_section": false }, { "bbox": { "l": 264.7, "t": 213.7, "r": 285.7, "b": 221.8, "coord_origin": "TOPLEFT" }, "row_span": 1, "col_span": 1, "start_row_offset_idx": 3, "end_row_offset_idx": 4, "start_col_offset_idx": 2, "end_col_offset_idx": 3, "text": "0.955 0.917", "column_header": false, "row_header": false, "row_section": false }, { "bbox": { "l": 302.4, "t": 213.7, "r": 323.4, "b": 221.8, "coord_origin": "TOPLEFT" }, "row_span": 1, "col_span": 1, "start_row_offset_idx": 3, "end_row_offset_idx": 4, "start_col_offset_idx": 3, "end_col_offset_idx": 4, "text": "0.961 0.922", "column_header": false, "row_header": false, "row_section": false }, { "bbox": { "l": 337.8, "t": 213.6, "r": 362.0, "b": 221.5, "coord_origin": "TOPLEFT" }, "row_span": 1, "col_span": 1, "start_row_offset_idx": 3, "end_row_offset_idx": 4, "start_col_offset_idx": 4, "end_col_offset_idx": 5, "text": "0.959 0.92", "column_header": false, "row_header": false, "row_section": false }, { "bbox": { "l": 380.5, "t": 213.6, "r": 404.6, "b": 221.5, "coord_origin": "TOPLEFT" }, "row_span": 1, "col_span": 1, "start_row_offset_idx": 3, "end_row_offset_idx": 4, "start_col_offset_idx": 5, "end_col_offset_idx": 6, "text": "0.862 0.722", "column_header": false, "row_header": false, "row_section": false }, { "bbox": { "l": 435.5, "t": 213.6, "r": 454.4, "b": 221.5, "coord_origin": "TOPLEFT" }, "row_span": 1, "col_span": 1, "start_row_offset_idx": 3, "end_row_offset_idx": 4, "start_col_offset_idx": 6, "end_col_offset_idx": 7, "text": "1.85 3.26", "column_header": false, "row_header": false, "row_section": false }, { "bbox": { "l": 148.6, "t": 245.5, "r": 207.2, "b": 253.5, "coord_origin": "TOPLEFT" }, "row_span": 1, "col_span": 1, "start_row_offset_idx": 4, "end_row_offset_idx": 5, "start_col_offset_idx": 0, "end_col_offset_idx": 1, "text": "PubTables-1M", "column_header": false, "row_header": false, "row_section": false }, { "bbox": { "l": 222.4, "t": 240.0, "r": 247.1, "b": 248.1, "coord_origin": "TOPLEFT" }, "row_span": 1, "col_span": 1, "start_row_offset_idx": 4, "end_row_offset_idx": 5, "start_col_offset_idx": 1, "end_col_offset_idx": 2, "text": "OTSL HTML", "column_header": false, "row_header": false, "row_section": false }, { "bbox": { "l": 264.7, "t": 240.0, "r": 285.7, "b": 248.1, "coord_origin": "TOPLEFT" }, "row_span": 1, "col_span": 1, "start_row_offset_idx": 4, "end_row_offset_idx": 5, "start_col_offset_idx": 2, "end_col_offset_idx": 3, "text": "0.987 0.983", "column_header": false, "row_header": false, "row_section": false }, { "bbox": { "l": 302.4, "t": 240.0, "r": 323.4, "b": 248.1, "coord_origin": "TOPLEFT" }, "row_span": 1, "col_span": 1, "start_row_offset_idx": 4, "end_row_offset_idx": 5, "start_col_offset_idx": 3, "end_col_offset_idx": 4, "text": "0.964 0.944", "column_header": false, "row_header": false, "row_section": false }, { "bbox": { "l": 337.8, "t": 239.9, "r": 362.0, "b": 247.8, "coord_origin": "TOPLEFT" }, "row_span": 1, "col_span": 1, "start_row_offset_idx": 4, "end_row_offset_idx": 5, "start_col_offset_idx": 4, "end_col_offset_idx": 5, "text": "0.977 0.966", "column_header": false, "row_header": false, "row_section": false }, { "bbox": { "l": 380.5, "t": 239.9, "r": 404.6, "b": 247.8, "coord_origin": "TOPLEFT" }, "row_span": 1, "col_span": 1, "start_row_offset_idx": 4, "end_row_offset_idx": 5, "start_col_offset_idx": 5, "end_col_offset_idx": 6, "text": "0.896 0.889", "column_header": false, "row_header": false, "row_section": false }, { "bbox": { "l": 435.5, "t": 239.9, "r": 454.4, "b": 247.8, "coord_origin": "TOPLEFT" }, "row_span": 1, "col_span": 1, "start_row_offset_idx": 4, "end_row_offset_idx": 5, "start_col_offset_idx": 6, "end_col_offset_idx": 7, "text": "1.79 3.26", "column_header": false, "row_header": false, "row_section": false } ] } } }, "figures_classification": null, "equations_prediction": null, "vlm_response": null }, "assembled": { "elements": [ { "label": "page_header", "id": 7, "page_no": 9, "cluster": { "id": 7, "label": "page_header", "bbox": { "l": 134.8, "t": 93.8, "r": 144.0, "b": 101.8, "coord_origin": "TOPLEFT" }, "confidence": 0.83, "cells": [ { "index": 0, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 134.8, "r_y0": 101.8, "r_x1": 144.0, "r_y1": 101.8, "r_x2": 144.0, "r_y2": 93.8, "r_x3": 134.8, "r_y3": 93.8, "coord_origin": "TOPLEFT" }, "text": "10", "orig": "10", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, "text": "10" }, { "label": "page_header", "id": 6, "page_no": 9, "cluster": { "id": 6, "label": "page_header", "bbox": { "l": 167.8, "t": 93.8, "r": 231.7, "b": 101.8, "coord_origin": "TOPLEFT" }, "confidence": 0.84, "cells": [ { "index": 1, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 167.8, "r_y0": 101.8, "r_x1": 178.1, "r_y1": 101.8, "r_x2": 178.1, "r_y2": 93.8, "r_x3": 167.8, "r_y3": 93.8, "coord_origin": "TOPLEFT" }, "text": "M.", "orig": "M.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 2, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 182.4, "r_y0": 101.8, "r_x1": 231.7, "r_y1": 101.8, "r_x2": 231.7, "r_y2": 93.8, "r_x3": 182.4, "r_y3": 93.8, "coord_origin": "TOPLEFT" }, "text": "Lysak, et al.", "orig": "Lysak, et al.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, "text": "M. Lysak, et al." }, { "label": "caption", "id": 4, "page_no": 9, "cluster": { "id": 4, "label": "caption", "bbox": { "l": 134.8, "t": 115.8, "r": 480.6, "b": 145.9, "coord_origin": "TOPLEFT" }, "confidence": 0.95, "cells": [ { "index": 3, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 134.8, "r_y0": 123.8, "r_x1": 173.1, "r_y1": 123.8, "r_x2": 173.1, "r_y2": 115.8, "r_x3": 134.8, "r_y3": 115.8, "coord_origin": "TOPLEFT" }, "text": "Table 2.", "orig": "Table 2.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 4, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 181.3, "r_y0": 124.0, "r_x1": 480.6, "r_y1": 124.0, "r_x2": 480.6, "r_y2": 115.9, "r_x3": 181.3, "r_y3": 115.9, "coord_origin": "TOPLEFT" }, "text": "TSR and cell detection results compared between OTSL and HTML on", "orig": "TSR and cell detection results compared between OTSL and HTML on", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 5, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 134.8, "r_y0": 134.9, "r_x1": 480.6, "r_y1": 134.9, "r_x2": 480.6, "r_y2": 126.9, "r_x3": 134.8, "r_y3": 126.9, "coord_origin": "TOPLEFT" }, "text": "the PubTabNet [22], FinTabNet [21] and PubTables-1M [14] data sets using Table-", "orig": "the PubTabNet [22], FinTabNet [21] and PubTables-1M [14] data sets using Table-", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 6, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 134.8, "r_y0": 145.9, "r_x1": 306.0, "r_y1": 145.9, "r_x2": 306.0, "r_y2": 137.8, "r_x3": 134.8, "r_y3": 137.8, "coord_origin": "TOPLEFT" }, "text": "Former [9] (with enc=6, dec=6, heads=8).", "orig": "Former [9] (with enc=6, dec=6, heads=8).", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, "text": "Table 2. TSR and cell detection results compared between OTSL and HTML on the PubTabNet [22], FinTabNet [21] and PubTables-1M [14] data sets using TableFormer [9] (with enc=6, dec=6, heads=8)." }, { "label": "table", "id": 0, "page_no": 9, "cluster": { "id": 0, "label": "table", "bbox": { "l": 143.6, "t": 156.3, "r": 470.8, "b": 263.3, "coord_origin": "TOPLEFT" }, "confidence": 0.99, "cells": [ { "index": 7, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 160.8, "r_y0": 174.6, "r_x1": 195.0, "r_y1": 174.6, "r_x2": 195.0, "r_y2": 166.6, "r_x3": 160.8, "r_y3": 166.6, "coord_origin": "TOPLEFT" }, "text": "Data set", "orig": "Data set", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 8, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 215.5, "r_y0": 174.6, "r_x1": 254.0, "r_y1": 174.6, "r_x2": 254.0, "r_y2": 166.5, "r_x3": 215.5, "r_y3": 166.5, "coord_origin": "TOPLEFT" }, "text": "Language", "orig": "Language", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 9, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 300.4, "r_y0": 169.1, "r_x1": 324.0, "r_y1": 169.1, "r_x2": 324.0, "r_y2": 161.1, "r_x3": 300.4, "r_y3": 161.1, "coord_origin": "TOPLEFT" }, "text": "TEDs", "orig": "TEDs", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 10, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 370.3, "r_y0": 174.6, "r_x1": 414.7, "r_y1": 174.6, "r_x2": 414.7, "r_y2": 166.6, "r_x3": 370.3, "r_y3": 166.6, "coord_origin": "TOPLEFT" }, "text": "mAP(0.75)", "orig": "mAP(0.75)", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 11, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 426.7, "r_y0": 169.1, "r_x1": 463.1, "r_y1": 169.1, "r_x2": 463.1, "r_y2": 161.1, "r_x3": 426.7, "r_y3": 161.1, "coord_origin": "TOPLEFT" }, "text": "Inference", "orig": "Inference", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 12, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 423.1, "r_y0": 180.1, "r_x1": 466.7, "r_y1": 180.1, "r_x2": 466.7, "r_y2": 172.0, "r_x3": 423.1, "r_y3": 172.0, "coord_origin": "TOPLEFT" }, "text": "time (secs)", "orig": "time (secs)", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 13, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 262.4, "r_y0": 182.1, "r_x1": 288.1, "r_y1": 182.1, "r_x2": 288.1, "r_y2": 174.0, "r_x3": 262.4, "r_y3": 174.0, "coord_origin": "TOPLEFT" }, "text": "simple", "orig": "simple", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 14, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 296.4, "r_y0": 182.1, "r_x1": 329.4, "r_y1": 182.1, "r_x2": 329.4, "r_y2": 174.0, "r_x3": 296.4, "r_y3": 174.0, "coord_origin": "TOPLEFT" }, "text": "complex", "orig": "complex", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 15, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 345.0, "r_y0": 182.1, "r_x1": 354.8, "r_y1": 182.1, "r_x2": 354.8, "r_y2": 174.0, "r_x3": 345.0, "r_y3": 174.0, "coord_origin": "TOPLEFT" }, "text": "all", "orig": "all", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 16, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 154.5, "r_y0": 200.9, "r_x1": 201.2, "r_y1": 200.9, "r_x2": 201.2, "r_y2": 192.9, "r_x3": 154.5, "r_y3": 192.9, "coord_origin": "TOPLEFT" }, "text": "PubTabNet", "orig": "PubTabNet", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 17, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 222.4, "r_y0": 195.5, "r_x1": 247.1, "r_y1": 195.5, "r_x2": 247.1, "r_y2": 187.4, "r_x3": 222.4, "r_y3": 187.4, "coord_origin": "TOPLEFT" }, "text": "OTSL", "orig": "OTSL", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 18, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 264.7, "r_y0": 195.5, "r_x1": 285.7, "r_y1": 195.5, "r_x2": 285.7, "r_y2": 187.4, "r_x3": 264.7, "r_y3": 187.4, "coord_origin": "TOPLEFT" }, "text": "0.965", "orig": "0.965", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 19, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 302.4, "r_y0": 195.5, "r_x1": 323.4, "r_y1": 195.5, "r_x2": 323.4, "r_y2": 187.4, "r_x3": 302.4, "r_y3": 187.4, "coord_origin": "TOPLEFT" }, "text": "0.934", "orig": "0.934", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 20, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 339.4, "r_y0": 195.5, "r_x1": 360.4, "r_y1": 195.5, "r_x2": 360.4, "r_y2": 187.4, "r_x3": 339.4, "r_y3": 187.4, "coord_origin": "TOPLEFT" }, "text": "0.955", "orig": "0.955", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 21, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 383.1, "r_y0": 195.2, "r_x1": 402.0, "r_y1": 195.2, "r_x2": 402.0, "r_y2": 187.3, "r_x3": 383.1, "r_y3": 187.3, "coord_origin": "TOPLEFT" }, "text": "0.88", "orig": "0.88", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 22, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 435.5, "r_y0": 195.2, "r_x1": 454.4, "r_y1": 195.2, "r_x2": 454.4, "r_y2": 187.3, "r_x3": 435.5, "r_y3": 187.3, "coord_origin": "TOPLEFT" }, "text": "2.73", "orig": "2.73", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 23, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 220.9, "r_y0": 208.4, "r_x1": 248.7, "r_y1": 208.4, "r_x2": 248.7, "r_y2": 200.3, "r_x3": 220.9, "r_y3": 200.3, "coord_origin": "TOPLEFT" }, "text": "HTML", "orig": "HTML", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 24, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 264.7, "r_y0": 208.4, "r_x1": 285.7, "r_y1": 208.4, "r_x2": 285.7, "r_y2": 200.3, "r_x3": 264.7, "r_y3": 200.3, "coord_origin": "TOPLEFT" }, "text": "0.969", "orig": "0.969", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 25, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 302.4, "r_y0": 208.4, "r_x1": 323.4, "r_y1": 208.4, "r_x2": 323.4, "r_y2": 200.3, "r_x3": 302.4, "r_y3": 200.3, "coord_origin": "TOPLEFT" }, "text": "0.927", "orig": "0.927", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 26, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 339.4, "r_y0": 208.4, "r_x1": 360.4, "r_y1": 208.4, "r_x2": 360.4, "r_y2": 200.3, "r_x3": 339.4, "r_y3": 200.3, "coord_origin": "TOPLEFT" }, "text": "0.955", "orig": "0.955", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 27, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 382.1, "r_y0": 208.4, "r_x1": 403.0, "r_y1": 208.4, "r_x2": 403.0, "r_y2": 200.3, "r_x3": 382.1, "r_y3": 200.3, "coord_origin": "TOPLEFT" }, "text": "0.857", "orig": "0.857", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 28, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 436.7, "r_y0": 208.4, "r_x1": 453.1, "r_y1": 208.4, "r_x2": 453.1, "r_y2": 200.3, "r_x3": 436.7, "r_y3": 200.3, "coord_origin": "TOPLEFT" }, "text": "5.39", "orig": "5.39", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 29, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 155.9, "r_y0": 227.2, "r_x1": 199.8, "r_y1": 227.2, "r_x2": 199.8, "r_y2": 219.2, "r_x3": 155.9, "r_y3": 219.2, "coord_origin": "TOPLEFT" }, "text": "FinTabNet", "orig": "FinTabNet", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 30, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 222.4, "r_y0": 221.8, "r_x1": 247.1, "r_y1": 221.8, "r_x2": 247.1, "r_y2": 213.7, "r_x3": 222.4, "r_y3": 213.7, "coord_origin": "TOPLEFT" }, "text": "OTSL", "orig": "OTSL", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 31, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 264.7, "r_y0": 221.8, "r_x1": 285.7, "r_y1": 221.8, "r_x2": 285.7, "r_y2": 213.7, "r_x3": 264.7, "r_y3": 213.7, "coord_origin": "TOPLEFT" }, "text": "0.955", "orig": "0.955", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 32, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 302.4, "r_y0": 221.8, "r_x1": 323.4, "r_y1": 221.8, "r_x2": 323.4, "r_y2": 213.7, "r_x3": 302.4, "r_y3": 213.7, "coord_origin": "TOPLEFT" }, "text": "0.961", "orig": "0.961", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 33, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 337.8, "r_y0": 221.5, "r_x1": 362.0, "r_y1": 221.5, "r_x2": 362.0, "r_y2": 213.6, "r_x3": 337.8, "r_y3": 213.6, "coord_origin": "TOPLEFT" }, "text": "0.959", "orig": "0.959", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 34, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 380.5, "r_y0": 221.5, "r_x1": 404.6, "r_y1": 221.5, "r_x2": 404.6, "r_y2": 213.6, "r_x3": 380.5, "r_y3": 213.6, "coord_origin": "TOPLEFT" }, "text": "0.862", "orig": "0.862", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 35, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 435.5, "r_y0": 221.5, "r_x1": 454.4, "r_y1": 221.5, "r_x2": 454.4, "r_y2": 213.6, "r_x3": 435.5, "r_y3": 213.6, "coord_origin": "TOPLEFT" }, "text": "1.85", "orig": "1.85", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 36, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 220.9, "r_y0": 234.7, "r_x1": 248.7, "r_y1": 234.7, "r_x2": 248.7, "r_y2": 226.6, "r_x3": 220.9, "r_y3": 226.6, "coord_origin": "TOPLEFT" }, "text": "HTML", "orig": "HTML", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 37, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 264.7, "r_y0": 234.7, "r_x1": 285.7, "r_y1": 234.7, "r_x2": 285.7, "r_y2": 226.6, "r_x3": 264.7, "r_y3": 226.6, "coord_origin": "TOPLEFT" }, "text": "0.917", "orig": "0.917", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 38, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 302.4, "r_y0": 234.7, "r_x1": 323.4, "r_y1": 234.7, "r_x2": 323.4, "r_y2": 226.6, "r_x3": 302.4, "r_y3": 226.6, "coord_origin": "TOPLEFT" }, "text": "0.922", "orig": "0.922", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 39, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 341.7, "r_y0": 234.7, "r_x1": 358.1, "r_y1": 234.7, "r_x2": 358.1, "r_y2": 226.6, "r_x3": 341.7, "r_y3": 226.6, "coord_origin": "TOPLEFT" }, "text": "0.92", "orig": "0.92", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 40, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 382.1, "r_y0": 234.7, "r_x1": 403.0, "r_y1": 234.7, "r_x2": 403.0, "r_y2": 226.6, "r_x3": 382.1, "r_y3": 226.6, "coord_origin": "TOPLEFT" }, "text": "0.722", "orig": "0.722", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 41, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 436.7, "r_y0": 234.7, "r_x1": 453.1, "r_y1": 234.7, "r_x2": 453.1, "r_y2": 226.6, "r_x3": 436.7, "r_y3": 226.6, "coord_origin": "TOPLEFT" }, "text": "3.26", "orig": "3.26", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 42, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 148.6, "r_y0": 253.5, "r_x1": 207.2, "r_y1": 253.5, "r_x2": 207.2, "r_y2": 245.5, "r_x3": 148.6, "r_y3": 245.5, "coord_origin": "TOPLEFT" }, "text": "PubTables-1M", "orig": "PubTables-1M", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 43, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 222.4, "r_y0": 248.1, "r_x1": 247.1, "r_y1": 248.1, "r_x2": 247.1, "r_y2": 240.0, "r_x3": 222.4, "r_y3": 240.0, "coord_origin": "TOPLEFT" }, "text": "OTSL", "orig": "OTSL", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 44, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 264.7, "r_y0": 248.1, "r_x1": 285.7, "r_y1": 248.1, "r_x2": 285.7, "r_y2": 240.0, "r_x3": 264.7, "r_y3": 240.0, "coord_origin": "TOPLEFT" }, "text": "0.987", "orig": "0.987", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 45, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 302.4, "r_y0": 248.1, "r_x1": 323.4, "r_y1": 248.1, "r_x2": 323.4, "r_y2": 240.0, "r_x3": 302.4, "r_y3": 240.0, "coord_origin": "TOPLEFT" }, "text": "0.964", "orig": "0.964", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 46, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 337.8, "r_y0": 247.8, "r_x1": 362.0, "r_y1": 247.8, "r_x2": 362.0, "r_y2": 239.9, "r_x3": 337.8, "r_y3": 239.9, "coord_origin": "TOPLEFT" }, "text": "0.977", "orig": "0.977", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 47, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 380.5, "r_y0": 247.8, "r_x1": 404.6, "r_y1": 247.8, "r_x2": 404.6, "r_y2": 239.9, "r_x3": 380.5, "r_y3": 239.9, "coord_origin": "TOPLEFT" }, "text": "0.896", "orig": "0.896", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 48, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 435.5, "r_y0": 247.8, "r_x1": 454.4, "r_y1": 247.8, "r_x2": 454.4, "r_y2": 239.9, "r_x3": 435.5, "r_y3": 239.9, "coord_origin": "TOPLEFT" }, "text": "1.79", "orig": "1.79", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 49, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 220.9, "r_y0": 261.0, "r_x1": 248.7, "r_y1": 261.0, "r_x2": 248.7, "r_y2": 252.9, "r_x3": 220.9, "r_y3": 252.9, "coord_origin": "TOPLEFT" }, "text": "HTML", "orig": "HTML", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 50, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 264.7, "r_y0": 261.0, "r_x1": 285.7, "r_y1": 261.0, "r_x2": 285.7, "r_y2": 252.9, "r_x3": 264.7, "r_y3": 252.9, "coord_origin": "TOPLEFT" }, "text": "0.983", "orig": "0.983", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 51, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 302.4, "r_y0": 261.0, "r_x1": 323.4, "r_y1": 261.0, "r_x2": 323.4, "r_y2": 252.9, "r_x3": 302.4, "r_y3": 252.9, "coord_origin": "TOPLEFT" }, "text": "0.944", "orig": "0.944", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 52, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 339.4, "r_y0": 261.0, "r_x1": 360.4, "r_y1": 261.0, "r_x2": 360.4, "r_y2": 252.9, "r_x3": 339.4, "r_y3": 252.9, "coord_origin": "TOPLEFT" }, "text": "0.966", "orig": "0.966", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 53, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 382.1, "r_y0": 261.0, "r_x1": 403.0, "r_y1": 261.0, "r_x2": 403.0, "r_y2": 252.9, "r_x3": 382.1, "r_y3": 252.9, "coord_origin": "TOPLEFT" }, "text": "0.889", "orig": "0.889", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 54, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 436.7, "r_y0": 261.0, "r_x1": 453.1, "r_y1": 261.0, "r_x2": 453.1, "r_y2": 252.9, "r_x3": 436.7, "r_y3": 252.9, "coord_origin": "TOPLEFT" }, "text": "3.26", "orig": "3.26", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [ { "id": 10, "label": "text", "bbox": { "l": 160.8, "t": 166.6, "r": 195.0, "b": 174.6, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 7, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 160.8, "r_y0": 174.6, "r_x1": 195.0, "r_y1": 174.6, "r_x2": 195.0, "r_y2": 166.6, "r_x3": 160.8, "r_y3": 166.6, "coord_origin": "TOPLEFT" }, "text": "Data set", "orig": "Data set", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 11, "label": "text", "bbox": { "l": 215.5, "t": 166.5, "r": 254.0, "b": 174.6, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 8, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 215.5, "r_y0": 174.6, "r_x1": 254.0, "r_y1": 174.6, "r_x2": 254.0, "r_y2": 166.5, "r_x3": 215.5, "r_y3": 166.5, "coord_origin": "TOPLEFT" }, "text": "Language", "orig": "Language", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 12, "label": "text", "bbox": { "l": 300.4, "t": 161.1, "r": 324.0, "b": 169.1, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 9, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 300.4, "r_y0": 169.1, "r_x1": 324.0, "r_y1": 169.1, "r_x2": 324.0, "r_y2": 161.1, "r_x3": 300.4, "r_y3": 161.1, "coord_origin": "TOPLEFT" }, "text": "TEDs", "orig": "TEDs", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 13, "label": "text", "bbox": { "l": 370.3, "t": 166.6, "r": 414.7, "b": 174.6, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 10, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 370.3, "r_y0": 174.6, "r_x1": 414.7, "r_y1": 174.6, "r_x2": 414.7, "r_y2": 166.6, "r_x3": 370.3, "r_y3": 166.6, "coord_origin": "TOPLEFT" }, "text": "mAP(0.75)", "orig": "mAP(0.75)", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 14, "label": "text", "bbox": { "l": 426.7, "t": 161.1, "r": 463.1, "b": 169.1, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 11, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 426.7, "r_y0": 169.1, "r_x1": 463.1, "r_y1": 169.1, "r_x2": 463.1, "r_y2": 161.1, "r_x3": 426.7, "r_y3": 161.1, "coord_origin": "TOPLEFT" }, "text": "Inference", "orig": "Inference", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 15, "label": "text", "bbox": { "l": 423.1, "t": 172.0, "r": 466.7, "b": 180.1, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 12, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 423.1, "r_y0": 180.1, "r_x1": 466.7, "r_y1": 180.1, "r_x2": 466.7, "r_y2": 172.0, "r_x3": 423.1, "r_y3": 172.0, "coord_origin": "TOPLEFT" }, "text": "time (secs)", "orig": "time (secs)", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 16, "label": "text", "bbox": { "l": 262.4, "t": 174.0, "r": 288.1, "b": 182.1, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 13, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 262.4, "r_y0": 182.1, "r_x1": 288.1, "r_y1": 182.1, "r_x2": 288.1, "r_y2": 174.0, "r_x3": 262.4, "r_y3": 174.0, "coord_origin": "TOPLEFT" }, "text": "simple", "orig": "simple", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 17, "label": "text", "bbox": { "l": 296.4, "t": 174.0, "r": 329.4, "b": 182.1, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 14, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 296.4, "r_y0": 182.1, "r_x1": 329.4, "r_y1": 182.1, "r_x2": 329.4, "r_y2": 174.0, "r_x3": 296.4, "r_y3": 174.0, "coord_origin": "TOPLEFT" }, "text": "complex", "orig": "complex", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 18, "label": "text", "bbox": { "l": 345.0, "t": 174.0, "r": 354.8, "b": 182.1, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 15, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 345.0, "r_y0": 182.1, "r_x1": 354.8, "r_y1": 182.1, "r_x2": 354.8, "r_y2": 174.0, "r_x3": 345.0, "r_y3": 174.0, "coord_origin": "TOPLEFT" }, "text": "all", "orig": "all", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 19, "label": "text", "bbox": { "l": 154.5, "t": 192.9, "r": 201.2, "b": 200.9, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 16, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 154.5, "r_y0": 200.9, "r_x1": 201.2, "r_y1": 200.9, "r_x2": 201.2, "r_y2": 192.9, "r_x3": 154.5, "r_y3": 192.9, "coord_origin": "TOPLEFT" }, "text": "PubTabNet", "orig": "PubTabNet", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 20, "label": "text", "bbox": { "l": 222.4, "t": 187.4, "r": 247.1, "b": 195.5, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 17, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 222.4, "r_y0": 195.5, "r_x1": 247.1, "r_y1": 195.5, "r_x2": 247.1, "r_y2": 187.4, "r_x3": 222.4, "r_y3": 187.4, "coord_origin": "TOPLEFT" }, "text": "OTSL", "orig": "OTSL", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 21, "label": "text", "bbox": { "l": 264.7, "t": 187.4, "r": 285.7, "b": 195.5, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 18, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 264.7, "r_y0": 195.5, "r_x1": 285.7, "r_y1": 195.5, "r_x2": 285.7, "r_y2": 187.4, "r_x3": 264.7, "r_y3": 187.4, "coord_origin": "TOPLEFT" }, "text": "0.965", "orig": "0.965", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 22, "label": "text", "bbox": { "l": 302.4, "t": 187.4, "r": 323.4, "b": 195.5, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 19, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 302.4, "r_y0": 195.5, "r_x1": 323.4, "r_y1": 195.5, "r_x2": 323.4, "r_y2": 187.4, "r_x3": 302.4, "r_y3": 187.4, "coord_origin": "TOPLEFT" }, "text": "0.934", "orig": "0.934", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 23, "label": "text", "bbox": { "l": 339.4, "t": 187.4, "r": 360.4, "b": 195.5, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 20, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 339.4, "r_y0": 195.5, "r_x1": 360.4, "r_y1": 195.5, "r_x2": 360.4, "r_y2": 187.4, "r_x3": 339.4, "r_y3": 187.4, "coord_origin": "TOPLEFT" }, "text": "0.955", "orig": "0.955", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 24, "label": "text", "bbox": { "l": 383.1, "t": 187.3, "r": 402.0, "b": 195.2, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 21, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 383.1, "r_y0": 195.2, "r_x1": 402.0, "r_y1": 195.2, "r_x2": 402.0, "r_y2": 187.3, "r_x3": 383.1, "r_y3": 187.3, "coord_origin": "TOPLEFT" }, "text": "0.88", "orig": "0.88", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 25, "label": "text", "bbox": { "l": 435.5, "t": 187.3, "r": 454.4, "b": 195.2, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 22, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 435.5, "r_y0": 195.2, "r_x1": 454.4, "r_y1": 195.2, "r_x2": 454.4, "r_y2": 187.3, "r_x3": 435.5, "r_y3": 187.3, "coord_origin": "TOPLEFT" }, "text": "2.73", "orig": "2.73", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 26, "label": "text", "bbox": { "l": 220.9, "t": 200.3, "r": 248.7, "b": 208.4, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 23, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 220.9, "r_y0": 208.4, "r_x1": 248.7, "r_y1": 208.4, "r_x2": 248.7, "r_y2": 200.3, "r_x3": 220.9, "r_y3": 200.3, "coord_origin": "TOPLEFT" }, "text": "HTML", "orig": "HTML", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 27, "label": "text", "bbox": { "l": 264.7, "t": 200.3, "r": 285.7, "b": 208.4, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 24, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 264.7, "r_y0": 208.4, "r_x1": 285.7, "r_y1": 208.4, "r_x2": 285.7, "r_y2": 200.3, "r_x3": 264.7, "r_y3": 200.3, "coord_origin": "TOPLEFT" }, "text": "0.969", "orig": "0.969", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 28, "label": "text", "bbox": { "l": 302.4, "t": 200.3, "r": 323.4, "b": 208.4, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 25, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 302.4, "r_y0": 208.4, "r_x1": 323.4, "r_y1": 208.4, "r_x2": 323.4, "r_y2": 200.3, "r_x3": 302.4, "r_y3": 200.3, "coord_origin": "TOPLEFT" }, "text": "0.927", "orig": "0.927", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 29, "label": "text", "bbox": { "l": 339.4, "t": 200.3, "r": 360.4, "b": 208.4, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 26, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 339.4, "r_y0": 208.4, "r_x1": 360.4, "r_y1": 208.4, "r_x2": 360.4, "r_y2": 200.3, "r_x3": 339.4, "r_y3": 200.3, "coord_origin": "TOPLEFT" }, "text": "0.955", "orig": "0.955", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 30, "label": "text", "bbox": { "l": 382.1, "t": 200.3, "r": 403.0, "b": 208.4, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 27, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 382.1, "r_y0": 208.4, "r_x1": 403.0, "r_y1": 208.4, "r_x2": 403.0, "r_y2": 200.3, "r_x3": 382.1, "r_y3": 200.3, "coord_origin": "TOPLEFT" }, "text": "0.857", "orig": "0.857", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 31, "label": "text", "bbox": { "l": 436.7, "t": 200.3, "r": 453.1, "b": 208.4, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 28, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 436.7, "r_y0": 208.4, "r_x1": 453.1, "r_y1": 208.4, "r_x2": 453.1, "r_y2": 200.3, "r_x3": 436.7, "r_y3": 200.3, "coord_origin": "TOPLEFT" }, "text": "5.39", "orig": "5.39", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 32, "label": "text", "bbox": { "l": 155.9, "t": 219.2, "r": 199.8, "b": 227.2, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 29, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 155.9, "r_y0": 227.2, "r_x1": 199.8, "r_y1": 227.2, "r_x2": 199.8, "r_y2": 219.2, "r_x3": 155.9, "r_y3": 219.2, "coord_origin": "TOPLEFT" }, "text": "FinTabNet", "orig": "FinTabNet", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 33, "label": "text", "bbox": { "l": 222.4, "t": 213.7, "r": 247.1, "b": 221.8, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 30, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 222.4, "r_y0": 221.8, "r_x1": 247.1, "r_y1": 221.8, "r_x2": 247.1, "r_y2": 213.7, "r_x3": 222.4, "r_y3": 213.7, "coord_origin": "TOPLEFT" }, "text": "OTSL", "orig": "OTSL", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 34, "label": "text", "bbox": { "l": 264.7, "t": 213.7, "r": 285.7, "b": 221.8, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 31, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 264.7, "r_y0": 221.8, "r_x1": 285.7, "r_y1": 221.8, "r_x2": 285.7, "r_y2": 213.7, "r_x3": 264.7, "r_y3": 213.7, "coord_origin": "TOPLEFT" }, "text": "0.955", "orig": "0.955", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 35, "label": "text", "bbox": { "l": 302.4, "t": 213.7, "r": 323.4, "b": 221.8, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 32, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 302.4, "r_y0": 221.8, "r_x1": 323.4, "r_y1": 221.8, "r_x2": 323.4, "r_y2": 213.7, "r_x3": 302.4, "r_y3": 213.7, "coord_origin": "TOPLEFT" }, "text": "0.961", "orig": "0.961", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 36, "label": "text", "bbox": { "l": 337.8, "t": 213.6, "r": 362.0, "b": 221.5, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 33, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 337.8, "r_y0": 221.5, "r_x1": 362.0, "r_y1": 221.5, "r_x2": 362.0, "r_y2": 213.6, "r_x3": 337.8, "r_y3": 213.6, "coord_origin": "TOPLEFT" }, "text": "0.959", "orig": "0.959", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 37, "label": "text", "bbox": { "l": 380.5, "t": 213.6, "r": 404.6, "b": 221.5, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 34, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 380.5, "r_y0": 221.5, "r_x1": 404.6, "r_y1": 221.5, "r_x2": 404.6, "r_y2": 213.6, "r_x3": 380.5, "r_y3": 213.6, "coord_origin": "TOPLEFT" }, "text": "0.862", "orig": "0.862", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 38, "label": "text", "bbox": { "l": 435.5, "t": 213.6, "r": 454.4, "b": 221.5, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 35, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 435.5, "r_y0": 221.5, "r_x1": 454.4, "r_y1": 221.5, "r_x2": 454.4, "r_y2": 213.6, "r_x3": 435.5, "r_y3": 213.6, "coord_origin": "TOPLEFT" }, "text": "1.85", "orig": "1.85", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 39, "label": "text", "bbox": { "l": 220.9, "t": 226.6, "r": 248.7, "b": 234.7, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 36, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 220.9, "r_y0": 234.7, "r_x1": 248.7, "r_y1": 234.7, "r_x2": 248.7, "r_y2": 226.6, "r_x3": 220.9, "r_y3": 226.6, "coord_origin": "TOPLEFT" }, "text": "HTML", "orig": "HTML", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 40, "label": "text", "bbox": { "l": 264.7, "t": 226.6, "r": 285.7, "b": 234.7, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 37, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 264.7, "r_y0": 234.7, "r_x1": 285.7, "r_y1": 234.7, "r_x2": 285.7, "r_y2": 226.6, "r_x3": 264.7, "r_y3": 226.6, "coord_origin": "TOPLEFT" }, "text": "0.917", "orig": "0.917", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 41, "label": "text", "bbox": { "l": 302.4, "t": 226.6, "r": 323.4, "b": 234.7, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 38, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 302.4, "r_y0": 234.7, "r_x1": 323.4, "r_y1": 234.7, "r_x2": 323.4, "r_y2": 226.6, "r_x3": 302.4, "r_y3": 226.6, "coord_origin": "TOPLEFT" }, "text": "0.922", "orig": "0.922", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 42, "label": "text", "bbox": { "l": 341.7, "t": 226.6, "r": 358.1, "b": 234.7, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 39, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 341.7, "r_y0": 234.7, "r_x1": 358.1, "r_y1": 234.7, "r_x2": 358.1, "r_y2": 226.6, "r_x3": 341.7, "r_y3": 226.6, "coord_origin": "TOPLEFT" }, "text": "0.92", "orig": "0.92", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 43, "label": "text", "bbox": { "l": 382.1, "t": 226.6, "r": 403.0, "b": 234.7, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 40, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 382.1, "r_y0": 234.7, "r_x1": 403.0, "r_y1": 234.7, "r_x2": 403.0, "r_y2": 226.6, "r_x3": 382.1, "r_y3": 226.6, "coord_origin": "TOPLEFT" }, "text": "0.722", "orig": "0.722", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 44, "label": "text", "bbox": { "l": 436.7, "t": 226.6, "r": 453.1, "b": 234.7, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 41, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 436.7, "r_y0": 234.7, "r_x1": 453.1, "r_y1": 234.7, "r_x2": 453.1, "r_y2": 226.6, "r_x3": 436.7, "r_y3": 226.6, "coord_origin": "TOPLEFT" }, "text": "3.26", "orig": "3.26", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 45, "label": "text", "bbox": { "l": 148.6, "t": 245.5, "r": 207.2, "b": 253.5, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 42, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 148.6, "r_y0": 253.5, "r_x1": 207.2, "r_y1": 253.5, "r_x2": 207.2, "r_y2": 245.5, "r_x3": 148.6, "r_y3": 245.5, "coord_origin": "TOPLEFT" }, "text": "PubTables-1M", "orig": "PubTables-1M", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 46, "label": "text", "bbox": { "l": 222.4, "t": 240.0, "r": 247.1, "b": 248.1, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 43, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 222.4, "r_y0": 248.1, "r_x1": 247.1, "r_y1": 248.1, "r_x2": 247.1, "r_y2": 240.0, "r_x3": 222.4, "r_y3": 240.0, "coord_origin": "TOPLEFT" }, "text": "OTSL", "orig": "OTSL", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 47, "label": "text", "bbox": { "l": 264.7, "t": 240.0, "r": 285.7, "b": 248.1, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 44, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 264.7, "r_y0": 248.1, "r_x1": 285.7, "r_y1": 248.1, "r_x2": 285.7, "r_y2": 240.0, "r_x3": 264.7, "r_y3": 240.0, "coord_origin": "TOPLEFT" }, "text": "0.987", "orig": "0.987", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 48, "label": "text", "bbox": { "l": 302.4, "t": 240.0, "r": 323.4, "b": 248.1, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 45, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 302.4, "r_y0": 248.1, "r_x1": 323.4, "r_y1": 248.1, "r_x2": 323.4, "r_y2": 240.0, "r_x3": 302.4, "r_y3": 240.0, "coord_origin": "TOPLEFT" }, "text": "0.964", "orig": "0.964", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 49, "label": "text", "bbox": { "l": 337.8, "t": 239.9, "r": 362.0, "b": 247.8, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 46, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 337.8, "r_y0": 247.8, "r_x1": 362.0, "r_y1": 247.8, "r_x2": 362.0, "r_y2": 239.9, "r_x3": 337.8, "r_y3": 239.9, "coord_origin": "TOPLEFT" }, "text": "0.977", "orig": "0.977", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 50, "label": "text", "bbox": { "l": 380.5, "t": 239.9, "r": 404.6, "b": 247.8, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 47, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 380.5, "r_y0": 247.8, "r_x1": 404.6, "r_y1": 247.8, "r_x2": 404.6, "r_y2": 239.9, "r_x3": 380.5, "r_y3": 239.9, "coord_origin": "TOPLEFT" }, "text": "0.896", "orig": "0.896", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 51, "label": "text", "bbox": { "l": 435.5, "t": 239.9, "r": 454.4, "b": 247.8, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 48, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 435.5, "r_y0": 247.8, "r_x1": 454.4, "r_y1": 247.8, "r_x2": 454.4, "r_y2": 239.9, "r_x3": 435.5, "r_y3": 239.9, "coord_origin": "TOPLEFT" }, "text": "1.79", "orig": "1.79", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 52, "label": "text", "bbox": { "l": 220.9, "t": 252.9, "r": 248.7, "b": 261.0, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 49, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 220.9, "r_y0": 261.0, "r_x1": 248.7, "r_y1": 261.0, "r_x2": 248.7, "r_y2": 252.9, "r_x3": 220.9, "r_y3": 252.9, "coord_origin": "TOPLEFT" }, "text": "HTML", "orig": "HTML", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 53, "label": "text", "bbox": { "l": 264.7, "t": 252.9, "r": 285.7, "b": 261.0, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 50, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 264.7, "r_y0": 261.0, "r_x1": 285.7, "r_y1": 261.0, "r_x2": 285.7, "r_y2": 252.9, "r_x3": 264.7, "r_y3": 252.9, "coord_origin": "TOPLEFT" }, "text": "0.983", "orig": "0.983", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 54, "label": "text", "bbox": { "l": 302.4, "t": 252.9, "r": 323.4, "b": 261.0, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 51, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 302.4, "r_y0": 261.0, "r_x1": 323.4, "r_y1": 261.0, "r_x2": 323.4, "r_y2": 252.9, "r_x3": 302.4, "r_y3": 252.9, "coord_origin": "TOPLEFT" }, "text": "0.944", "orig": "0.944", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 55, "label": "text", "bbox": { "l": 339.4, "t": 252.9, "r": 360.4, "b": 261.0, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 52, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 339.4, "r_y0": 261.0, "r_x1": 360.4, "r_y1": 261.0, "r_x2": 360.4, "r_y2": 252.9, "r_x3": 339.4, "r_y3": 252.9, "coord_origin": "TOPLEFT" }, "text": "0.966", "orig": "0.966", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 56, "label": "text", "bbox": { "l": 382.1, "t": 252.9, "r": 403.0, "b": 261.0, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 53, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 382.1, "r_y0": 261.0, "r_x1": 403.0, "r_y1": 261.0, "r_x2": 403.0, "r_y2": 252.9, "r_x3": 382.1, "r_y3": 252.9, "coord_origin": "TOPLEFT" }, "text": "0.889", "orig": "0.889", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 57, "label": "text", "bbox": { "l": 436.7, "t": 252.9, "r": 453.1, "b": 261.0, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 54, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 436.7, "r_y0": 261.0, "r_x1": 453.1, "r_y1": 261.0, "r_x2": 453.1, "r_y2": 252.9, "r_x3": 436.7, "r_y3": 252.9, "coord_origin": "TOPLEFT" }, "text": "3.26", "orig": "3.26", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] } ] }, "text": null, "otsl_seq": [ "ched", "ched", "ched", "lcel", "lcel", "ched", "ched", "nl", "ucel", "ucel", "ched", "ched", "ched", "ucel", "ucel", "nl", "fcel", "fcel", "fcel", "fcel", "fcel", "fcel", "fcel", "nl", "fcel", "fcel", "fcel", "fcel", "fcel", "fcel", "fcel", "nl", "fcel", "fcel", "fcel", "fcel", "fcel", "fcel", "fcel", "nl" ], "num_rows": 5, "num_cols": 7, "table_cells": [ { "bbox": { "l": 160.8, "t": 166.6, "r": 195.0, "b": 174.6, "coord_origin": "TOPLEFT" }, "row_span": 2, "col_span": 1, "start_row_offset_idx": 0, "end_row_offset_idx": 2, "start_col_offset_idx": 0, "end_col_offset_idx": 1, "text": "Data set", "column_header": true, "row_header": false, "row_section": false }, { "bbox": { "l": 215.5, "t": 166.5, "r": 254.0, "b": 174.6, "coord_origin": "TOPLEFT" }, "row_span": 2, "col_span": 1, "start_row_offset_idx": 0, "end_row_offset_idx": 2, "start_col_offset_idx": 1, "end_col_offset_idx": 2, "text": "Language", "column_header": true, "row_header": false, "row_section": false }, { "bbox": { "l": 300.4, "t": 161.1, "r": 324.0, "b": 169.1, "coord_origin": "TOPLEFT" }, "row_span": 1, "col_span": 3, "start_row_offset_idx": 0, "end_row_offset_idx": 1, "start_col_offset_idx": 2, "end_col_offset_idx": 5, "text": "TEDs", "column_header": true, "row_header": false, "row_section": false }, { "bbox": { "l": 370.3, "t": 166.6, "r": 414.7, "b": 174.6, "coord_origin": "TOPLEFT" }, "row_span": 2, "col_span": 1, "start_row_offset_idx": 0, "end_row_offset_idx": 2, "start_col_offset_idx": 5, "end_col_offset_idx": 6, "text": "mAP(0.75)", "column_header": true, "row_header": false, "row_section": false }, { "bbox": { "l": 426.7, "t": 161.1, "r": 463.1, "b": 169.1, "coord_origin": "TOPLEFT" }, "row_span": 2, "col_span": 1, "start_row_offset_idx": 0, "end_row_offset_idx": 2, "start_col_offset_idx": 6, "end_col_offset_idx": 7, "text": "Inference time (secs)", "column_header": true, "row_header": false, "row_section": false }, { "bbox": { "l": 262.4, "t": 174.0, "r": 288.1, "b": 182.1, "coord_origin": "TOPLEFT" }, "row_span": 1, "col_span": 1, "start_row_offset_idx": 1, "end_row_offset_idx": 2, "start_col_offset_idx": 2, "end_col_offset_idx": 3, "text": "simple", "column_header": true, "row_header": false, "row_section": false }, { "bbox": { "l": 296.4, "t": 174.0, "r": 329.4, "b": 182.1, "coord_origin": "TOPLEFT" }, "row_span": 1, "col_span": 1, "start_row_offset_idx": 1, "end_row_offset_idx": 2, "start_col_offset_idx": 3, "end_col_offset_idx": 4, "text": "complex", "column_header": true, "row_header": false, "row_section": false }, { "bbox": { "l": 345.0, "t": 174.0, "r": 354.8, "b": 182.1, "coord_origin": "TOPLEFT" }, "row_span": 1, "col_span": 1, "start_row_offset_idx": 1, "end_row_offset_idx": 2, "start_col_offset_idx": 4, "end_col_offset_idx": 5, "text": "all", "column_header": true, "row_header": false, "row_section": false }, { "bbox": { "l": 154.5, "t": 192.9, "r": 201.2, "b": 200.9, "coord_origin": "TOPLEFT" }, "row_span": 1, "col_span": 1, "start_row_offset_idx": 2, "end_row_offset_idx": 3, "start_col_offset_idx": 0, "end_col_offset_idx": 1, "text": "PubTabNet", "column_header": false, "row_header": false, "row_section": false }, { "bbox": { "l": 222.4, "t": 187.4, "r": 247.1, "b": 195.5, "coord_origin": "TOPLEFT" }, "row_span": 1, "col_span": 1, "start_row_offset_idx": 2, "end_row_offset_idx": 3, "start_col_offset_idx": 1, "end_col_offset_idx": 2, "text": "OTSL HTML", "column_header": false, "row_header": false, "row_section": false }, { "bbox": { "l": 264.7, "t": 187.4, "r": 285.7, "b": 195.5, "coord_origin": "TOPLEFT" }, "row_span": 1, "col_span": 1, "start_row_offset_idx": 2, "end_row_offset_idx": 3, "start_col_offset_idx": 2, "end_col_offset_idx": 3, "text": "0.965 0.969", "column_header": false, "row_header": false, "row_section": false }, { "bbox": { "l": 302.4, "t": 187.4, "r": 323.4, "b": 195.5, "coord_origin": "TOPLEFT" }, "row_span": 1, "col_span": 1, "start_row_offset_idx": 2, "end_row_offset_idx": 3, "start_col_offset_idx": 3, "end_col_offset_idx": 4, "text": "0.934 0.927", "column_header": false, "row_header": false, "row_section": false }, { "bbox": { "l": 339.4, "t": 187.4, "r": 360.4, "b": 195.5, "coord_origin": "TOPLEFT" }, "row_span": 1, "col_span": 1, "start_row_offset_idx": 2, "end_row_offset_idx": 3, "start_col_offset_idx": 4, "end_col_offset_idx": 5, "text": "0.955 0.955", "column_header": false, "row_header": false, "row_section": false }, { "bbox": { "l": 383.1, "t": 187.3, "r": 402.0, "b": 195.2, "coord_origin": "TOPLEFT" }, "row_span": 1, "col_span": 1, "start_row_offset_idx": 2, "end_row_offset_idx": 3, "start_col_offset_idx": 5, "end_col_offset_idx": 6, "text": "0.88 0.857", "column_header": false, "row_header": false, "row_section": false }, { "bbox": { "l": 435.5, "t": 187.3, "r": 454.4, "b": 195.2, "coord_origin": "TOPLEFT" }, "row_span": 1, "col_span": 1, "start_row_offset_idx": 2, "end_row_offset_idx": 3, "start_col_offset_idx": 6, "end_col_offset_idx": 7, "text": "2.73 5.39", "column_header": false, "row_header": false, "row_section": false }, { "bbox": { "l": 155.9, "t": 219.2, "r": 199.8, "b": 227.2, "coord_origin": "TOPLEFT" }, "row_span": 1, "col_span": 1, "start_row_offset_idx": 3, "end_row_offset_idx": 4, "start_col_offset_idx": 0, "end_col_offset_idx": 1, "text": "FinTabNet", "column_header": false, "row_header": false, "row_section": false }, { "bbox": { "l": 222.4, "t": 213.7, "r": 247.1, "b": 221.8, "coord_origin": "TOPLEFT" }, "row_span": 1, "col_span": 1, "start_row_offset_idx": 3, "end_row_offset_idx": 4, "start_col_offset_idx": 1, "end_col_offset_idx": 2, "text": "OTSL HTML", "column_header": false, "row_header": false, "row_section": false }, { "bbox": { "l": 264.7, "t": 213.7, "r": 285.7, "b": 221.8, "coord_origin": "TOPLEFT" }, "row_span": 1, "col_span": 1, "start_row_offset_idx": 3, "end_row_offset_idx": 4, "start_col_offset_idx": 2, "end_col_offset_idx": 3, "text": "0.955 0.917", "column_header": false, "row_header": false, "row_section": false }, { "bbox": { "l": 302.4, "t": 213.7, "r": 323.4, "b": 221.8, "coord_origin": "TOPLEFT" }, "row_span": 1, "col_span": 1, "start_row_offset_idx": 3, "end_row_offset_idx": 4, "start_col_offset_idx": 3, "end_col_offset_idx": 4, "text": "0.961 0.922", "column_header": false, "row_header": false, "row_section": false }, { "bbox": { "l": 337.8, "t": 213.6, "r": 362.0, "b": 221.5, "coord_origin": "TOPLEFT" }, "row_span": 1, "col_span": 1, "start_row_offset_idx": 3, "end_row_offset_idx": 4, "start_col_offset_idx": 4, "end_col_offset_idx": 5, "text": "0.959 0.92", "column_header": false, "row_header": false, "row_section": false }, { "bbox": { "l": 380.5, "t": 213.6, "r": 404.6, "b": 221.5, "coord_origin": "TOPLEFT" }, "row_span": 1, "col_span": 1, "start_row_offset_idx": 3, "end_row_offset_idx": 4, "start_col_offset_idx": 5, "end_col_offset_idx": 6, "text": "0.862 0.722", "column_header": false, "row_header": false, "row_section": false }, { "bbox": { "l": 435.5, "t": 213.6, "r": 454.4, "b": 221.5, "coord_origin": "TOPLEFT" }, "row_span": 1, "col_span": 1, "start_row_offset_idx": 3, "end_row_offset_idx": 4, "start_col_offset_idx": 6, "end_col_offset_idx": 7, "text": "1.85 3.26", "column_header": false, "row_header": false, "row_section": false }, { "bbox": { "l": 148.6, "t": 245.5, "r": 207.2, "b": 253.5, "coord_origin": "TOPLEFT" }, "row_span": 1, "col_span": 1, "start_row_offset_idx": 4, "end_row_offset_idx": 5, "start_col_offset_idx": 0, "end_col_offset_idx": 1, "text": "PubTables-1M", "column_header": false, "row_header": false, "row_section": false }, { "bbox": { "l": 222.4, "t": 240.0, "r": 247.1, "b": 248.1, "coord_origin": "TOPLEFT" }, "row_span": 1, "col_span": 1, "start_row_offset_idx": 4, "end_row_offset_idx": 5, "start_col_offset_idx": 1, "end_col_offset_idx": 2, "text": "OTSL HTML", "column_header": false, "row_header": false, "row_section": false }, { "bbox": { "l": 264.7, "t": 240.0, "r": 285.7, "b": 248.1, "coord_origin": "TOPLEFT" }, "row_span": 1, "col_span": 1, "start_row_offset_idx": 4, "end_row_offset_idx": 5, "start_col_offset_idx": 2, "end_col_offset_idx": 3, "text": "0.987 0.983", "column_header": false, "row_header": false, "row_section": false }, { "bbox": { "l": 302.4, "t": 240.0, "r": 323.4, "b": 248.1, "coord_origin": "TOPLEFT" }, "row_span": 1, "col_span": 1, "start_row_offset_idx": 4, "end_row_offset_idx": 5, "start_col_offset_idx": 3, "end_col_offset_idx": 4, "text": "0.964 0.944", "column_header": false, "row_header": false, "row_section": false }, { "bbox": { "l": 337.8, "t": 239.9, "r": 362.0, "b": 247.8, "coord_origin": "TOPLEFT" }, "row_span": 1, "col_span": 1, "start_row_offset_idx": 4, "end_row_offset_idx": 5, "start_col_offset_idx": 4, "end_col_offset_idx": 5, "text": "0.977 0.966", "column_header": false, "row_header": false, "row_section": false }, { "bbox": { "l": 380.5, "t": 239.9, "r": 404.6, "b": 247.8, "coord_origin": "TOPLEFT" }, "row_span": 1, "col_span": 1, "start_row_offset_idx": 4, "end_row_offset_idx": 5, "start_col_offset_idx": 5, "end_col_offset_idx": 6, "text": "0.896 0.889", "column_header": false, "row_header": false, "row_section": false }, { "bbox": { "l": 435.5, "t": 239.9, "r": 454.4, "b": 247.8, "coord_origin": "TOPLEFT" }, "row_span": 1, "col_span": 1, "start_row_offset_idx": 4, "end_row_offset_idx": 5, "start_col_offset_idx": 6, "end_col_offset_idx": 7, "text": "1.79 3.26", "column_header": false, "row_header": false, "row_section": false } ] }, { "label": "section_header", "id": 3, "page_no": 9, "cluster": { "id": 3, "label": "section_header", "bbox": { "l": 134.8, "t": 288.9, "r": 257.1, "b": 297.7, "coord_origin": "TOPLEFT" }, "confidence": 0.95, "cells": [ { "index": 55, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 134.8, "r_y0": 297.7, "r_x1": 149.4, "r_y1": 297.7, "r_x2": 149.4, "r_y2": 288.9, "r_x3": 134.8, "r_y3": 288.9, "coord_origin": "TOPLEFT" }, "text": "5.3", "orig": "5.3", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 56, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 160.9, "r_y0": 297.7, "r_x1": 257.1, "r_y1": 297.7, "r_x2": 257.1, "r_y2": 288.9, "r_x3": 160.9, "r_y3": 288.9, "coord_origin": "TOPLEFT" }, "text": "Qualitative Results", "orig": "Qualitative Results", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, "text": "5.3 Qualitative Results" }, { "label": "text", "id": 1, "page_no": 9, "cluster": { "id": 1, "label": "text", "bbox": { "l": 134.8, "t": 309.9, "r": 480.6, "b": 366.5, "coord_origin": "TOPLEFT" }, "confidence": 0.98, "cells": [ { "index": 57, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 134.8, "r_y0": 318.7, "r_x1": 480.6, "r_y1": 318.7, "r_x2": 480.6, "r_y2": 309.9, "r_x3": 134.8, "r_y3": 309.9, "coord_origin": "TOPLEFT" }, "text": "To illustrate the qualitative differences between OTSL and HTML, Figure 5", "orig": "To illustrate the qualitative differences between OTSL and HTML, Figure 5", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 58, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 134.8, "r_y0": 330.6, "r_x1": 480.6, "r_y1": 330.6, "r_x2": 480.6, "r_y2": 321.8, "r_x3": 134.8, "r_y3": 321.8, "coord_origin": "TOPLEFT" }, "text": "demonstrates less overlap and more accurate bounding boxes with OTSL. In", "orig": "demonstrates less overlap and more accurate bounding boxes with OTSL. In", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 59, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 134.8, "r_y0": 342.6, "r_x1": 480.6, "r_y1": 342.6, "r_x2": 480.6, "r_y2": 333.8, "r_x3": 134.8, "r_y3": 333.8, "coord_origin": "TOPLEFT" }, "text": "Figure 6, OTSL proves to be more effective in handling tables with longer to-", "orig": "Figure 6, OTSL proves to be more effective in handling tables with longer to-", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 60, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 134.8, "r_y0": 354.5, "r_x1": 480.6, "r_y1": 354.5, "r_x2": 480.6, "r_y2": 345.7, "r_x3": 134.8, "r_y3": 345.7, "coord_origin": "TOPLEFT" }, "text": "ken sequences, resulting in even more precise structure prediction and bounding", "orig": "ken sequences, resulting in even more precise structure prediction and bounding", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 61, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 134.8, "r_y0": 366.5, "r_x1": 161.7, "r_y1": 366.5, "r_x2": 161.7, "r_y2": 357.7, "r_x3": 134.8, "r_y3": 357.7, "coord_origin": "TOPLEFT" }, "text": "boxes.", "orig": "boxes.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, "text": "To illustrate the qualitative differences between OTSL and HTML, Figure 5 demonstrates less overlap and more accurate bounding boxes with OTSL. In Figure 6, OTSL proves to be more effective in handling tables with longer token sequences, resulting in even more precise structure prediction and bounding boxes." }, { "label": "caption", "id": 5, "page_no": 9, "cluster": { "id": 5, "label": "caption", "bbox": { "l": 134.8, "t": 397.6, "r": 480.6, "b": 439.7, "coord_origin": "TOPLEFT" }, "confidence": 0.95, "cells": [ { "index": 62, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 134.8, "r_y0": 405.5, "r_x1": 162.6, "r_y1": 405.5, "r_x2": 162.6, "r_y2": 397.6, "r_x3": 134.8, "r_y3": 397.6, "coord_origin": "TOPLEFT" }, "text": "Fig. 5.", "orig": "Fig. 5.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 63, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 167.4, "r_y0": 405.7, "r_x1": 480.6, "r_y1": 405.7, "r_x2": 480.6, "r_y2": 397.7, "r_x3": 167.4, "r_y3": 397.7, "coord_origin": "TOPLEFT" }, "text": "The OTSL model produces more accurate bounding boxes with less over-", "orig": "The OTSL model produces more accurate bounding boxes with less over-", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 64, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 134.8, "r_y0": 416.7, "r_x1": 480.6, "r_y1": 416.7, "r_x2": 480.6, "r_y2": 408.6, "r_x3": 134.8, "r_y3": 408.6, "coord_origin": "TOPLEFT" }, "text": "lap (E) than the HTML model (D), when predicting the structure of a sparse ta-", "orig": "lap (E) than the HTML model (D), when predicting the structure of a sparse ta-", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 65, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 134.8, "r_y0": 427.6, "r_x1": 480.6, "r_y1": 427.6, "r_x2": 480.6, "r_y2": 419.6, "r_x3": 134.8, "r_y3": 419.6, "coord_origin": "TOPLEFT" }, "text": "ble (A), at twice the inference speed because of shorter sequence length (B),(C).", "orig": "ble (A), at twice the inference speed because of shorter sequence length (B),(C).", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 66, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 134.8, "r_y0": 438.6, "r_x1": 304.7, "r_y1": 438.6, "r_x2": 304.7, "r_y2": 430.5, "r_x3": 134.8, "r_y3": 430.5, "coord_origin": "TOPLEFT" }, "text": "\"PMC2807444_006_00.png\" PubTabNet.", "orig": "\"PMC2807444_006_00.png\" PubTabNet.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 118, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 342.6, "r_y0": 439.7, "r_x1": 344.8, "r_y1": 439.7, "r_x2": 344.8, "r_y2": 430.2, "r_x3": 342.6, "r_y3": 430.2, "coord_origin": "TOPLEFT" }, "text": "\u03bc", "orig": "\u03bc", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, "text": "Fig. 5. The OTSL model produces more accurate bounding boxes with less overlap (E) than the HTML model (D), when predicting the structure of a sparse table (A), at twice the inference speed because of shorter sequence length (B),(C). \"PMC2807444_006_00.png\" PubTabNet. \u03bc" }, { "label": "picture", "id": 2, "page_no": 9, "cluster": { "id": 2, "label": "picture", "bbox": { "l": 162.7, "t": 444.6, "r": 451.7, "b": 663.2, "coord_origin": "TOPLEFT" }, "confidence": 0.97, "cells": [ { "index": 67, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 180.1, "r_y0": 518.9, "r_x1": 190.6, "r_y1": 518.9, "r_x2": 190.6, "r_y2": 516.2, "r_x3": 180.1, "r_y3": 516.2, "coord_origin": "TOPLEFT" }, "text": "", "orig": "
", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 68, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 183.2, "r_y0": 522.8, "r_x1": 304.5, "r_y1": 522.8, "r_x2": 304.5, "r_y2": 520.1, "r_x3": 183.2, "r_y3": 520.1, "coord_origin": "TOPLEFT" }, "text": "", "orig": "", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 69, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 183.2, "r_y0": 526.7, "r_x1": 388.4, "r_y1": 526.7, "r_x2": 388.4, "r_y2": 524.0, "r_x3": 183.2, "r_y3": 524.0, "coord_origin": "TOPLEFT" }, "text": "", "orig": "", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 70, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 183.2, "r_y0": 530.6, "r_x1": 388.4, "r_y1": 530.6, "r_x2": 388.4, "r_y2": 527.9, "r_x3": 183.2, "r_y3": 527.9, "coord_origin": "TOPLEFT" }, "text": "", "orig": "", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 71, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 183.2, "r_y0": 534.5, "r_x1": 388.4, "r_y1": 534.5, "r_x2": 388.4, "r_y2": 531.8, "r_x3": 183.2, "r_y3": 531.8, "coord_origin": "TOPLEFT" }, "text": "", "orig": "", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 72, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 183.2, "r_y0": 538.4, "r_x1": 388.4, "r_y1": 538.4, "r_x2": 388.4, "r_y2": 535.7, "r_x3": 183.2, "r_y3": 535.7, "coord_origin": "TOPLEFT" }, "text": "", "orig": "", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 73, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 183.2, "r_y0": 542.3, "r_x1": 388.4, "r_y1": 542.3, "r_x2": 388.4, "r_y2": 539.6, "r_x3": 183.2, "r_y3": 539.6, "coord_origin": "TOPLEFT" }, "text": "", "orig": "", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 74, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 183.2, "r_y0": 546.2, "r_x1": 388.4, "r_y1": 546.2, "r_x2": 388.4, "r_y2": 543.5, "r_x3": 183.2, "r_y3": 543.5, "coord_origin": "TOPLEFT" }, "text": "", "orig": "", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 75, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 183.2, "r_y0": 550.1, "r_x1": 388.4, "r_y1": 550.1, "r_x2": 388.4, "r_y2": 547.4, "r_x3": 183.2, "r_y3": 547.4, "coord_origin": "TOPLEFT" }, "text": "", "orig": "", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 76, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 183.2, "r_y0": 554.0, "r_x1": 388.4, "r_y1": 554.0, "r_x2": 388.4, "r_y2": 551.3, "r_x3": 183.2, "r_y3": 551.3, "coord_origin": "TOPLEFT" }, "text": "", "orig": "", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 77, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 180.1, "r_y0": 557.9, "r_x1": 191.9, "r_y1": 557.9, "r_x2": 191.9, "r_y2": 555.2, "r_x3": 180.1, "r_y3": 555.2, "coord_origin": "TOPLEFT" }, "text": "
", "orig": "", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 78, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 407.4, "r_y0": 521.0, "r_x1": 408.8, "r_y1": 521.0, "r_x2": 408.8, "r_y2": 518.3, "r_x3": 407.4, "r_y3": 518.3, "coord_origin": "TOPLEFT" }, "text": "C", "orig": "C", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 79, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 410.3, "r_y0": 521.0, "r_x1": 450.5, "r_y1": 521.0, "r_x2": 450.5, "r_y2": 518.3, "r_x3": 410.3, "r_y3": 518.3, "coord_origin": "TOPLEFT" }, "text": "C L L L C L L L L L C L L NL", "orig": "C L L L C L L L L L C L L NL", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 80, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 407.4, "r_y0": 524.9, "r_x1": 408.8, "r_y1": 524.9, "r_x2": 408.8, "r_y2": 522.2, "r_x3": 407.4, "r_y3": 522.2, "coord_origin": "TOPLEFT" }, "text": "C", "orig": "C", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 81, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 410.3, "r_y0": 524.9, "r_x1": 450.5, "r_y1": 524.9, "r_x2": 450.5, "r_y2": 522.2, "r_x3": 410.3, "r_y3": 522.2, "coord_origin": "TOPLEFT" }, "text": "C C C C C C C C C C C C C NL", "orig": "C C C C C C C C C C C C C NL", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 82, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 407.4, "r_y0": 528.8, "r_x1": 408.8, "r_y1": 528.8, "r_x2": 408.8, "r_y2": 526.1, "r_x3": 407.4, "r_y3": 526.1, "coord_origin": "TOPLEFT" }, "text": "C", "orig": "C", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 83, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 410.3, "r_y0": 528.8, "r_x1": 450.5, "r_y1": 528.8, "r_x2": 450.5, "r_y2": 526.1, "r_x3": 410.3, "r_y3": 526.1, "coord_origin": "TOPLEFT" }, "text": "C C C C C C C C C C C C C NL", "orig": "C C C C C C C C C C C C C NL", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 84, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 407.4, "r_y0": 532.7, "r_x1": 408.8, "r_y1": 532.7, "r_x2": 408.8, "r_y2": 530.0, "r_x3": 407.4, "r_y3": 530.0, "coord_origin": "TOPLEFT" }, "text": "C", "orig": "C", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 85, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 410.3, "r_y0": 532.7, "r_x1": 450.5, "r_y1": 532.7, "r_x2": 450.5, "r_y2": 530.0, "r_x3": 410.3, "r_y3": 530.0, "coord_origin": "TOPLEFT" }, "text": "C C C C C C C C C C C C C NL", "orig": "C C C C C C C C C C C C C NL", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 86, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 407.4, "r_y0": 536.6, "r_x1": 408.8, "r_y1": 536.6, "r_x2": 408.8, "r_y2": 533.9, "r_x3": 407.4, "r_y3": 533.9, "coord_origin": "TOPLEFT" }, "text": "C", "orig": "C", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 87, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 410.3, "r_y0": 536.6, "r_x1": 450.5, "r_y1": 536.6, "r_x2": 450.5, "r_y2": 533.9, "r_x3": 410.3, "r_y3": 533.9, "coord_origin": "TOPLEFT" }, "text": "C C C C C C C C C C C C C NL", "orig": "C C C C C C C C C C C C C NL", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 88, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 407.4, "r_y0": 540.5, "r_x1": 408.8, "r_y1": 540.5, "r_x2": 408.8, "r_y2": 537.8, "r_x3": 407.4, "r_y3": 537.8, "coord_origin": "TOPLEFT" }, "text": "C", "orig": "C", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 89, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 410.3, "r_y0": 540.5, "r_x1": 450.5, "r_y1": 540.5, "r_x2": 450.5, "r_y2": 537.8, "r_x3": 410.3, "r_y3": 537.8, "coord_origin": "TOPLEFT" }, "text": "C C C C C C C C C C C C C NL", "orig": "C C C C C C C C C C C C C NL", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 90, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 407.4, "r_y0": 544.4, "r_x1": 408.8, "r_y1": 544.4, "r_x2": 408.8, "r_y2": 541.7, "r_x3": 407.4, "r_y3": 541.7, "coord_origin": "TOPLEFT" }, "text": "C", "orig": "C", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 91, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 410.3, "r_y0": 544.4, "r_x1": 450.5, "r_y1": 544.4, "r_x2": 450.5, "r_y2": 541.7, "r_x3": 410.3, "r_y3": 541.7, "coord_origin": "TOPLEFT" }, "text": "C C C C C C C C C C C C C NL", "orig": "C C C C C C C C C C C C C NL", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 92, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 407.4, "r_y0": 548.3, "r_x1": 408.8, "r_y1": 548.3, "r_x2": 408.8, "r_y2": 545.6, "r_x3": 407.4, "r_y3": 545.6, "coord_origin": "TOPLEFT" }, "text": "C", "orig": "C", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 93, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 410.3, "r_y0": 548.3, "r_x1": 450.5, "r_y1": 548.3, "r_x2": 450.5, "r_y2": 545.6, "r_x3": 410.3, "r_y3": 545.6, "coord_origin": "TOPLEFT" }, "text": "C C C C C C C C C C C C C NL", "orig": "C C C C C C C C C C C C C NL", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 94, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 407.4, "r_y0": 552.2, "r_x1": 408.8, "r_y1": 552.2, "r_x2": 408.8, "r_y2": 549.5, "r_x3": 407.4, "r_y3": 549.5, "coord_origin": "TOPLEFT" }, "text": "C", "orig": "C", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 95, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 410.3, "r_y0": 552.2, "r_x1": 450.5, "r_y1": 552.2, "r_x2": 450.5, "r_y2": 549.5, "r_x3": 410.3, "r_y3": 549.5, "coord_origin": "TOPLEFT" }, "text": "C C C C C C C C C C C C C NL", "orig": "C C C C C C C C C C C C C NL", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 96, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 164.5, "r_y0": 515.3, "r_x1": 181.9, "r_y1": 515.3, "r_x2": 181.9, "r_y2": 509.5, "r_x3": 164.5, "r_y3": 509.5, "coord_origin": "TOPLEFT" }, "text": "HTML", "orig": "HTML", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 97, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 183.6, "r_y0": 515.3, "r_x1": 186.4, "r_y1": 515.3, "r_x2": 186.4, "r_y2": 509.5, "r_x3": 183.6, "r_y3": 509.5, "coord_origin": "TOPLEFT" }, "text": "#", "orig": "#", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 98, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 189.2, "r_y0": 515.3, "r_x1": 208.9, "r_y1": 515.3, "r_x2": 208.9, "r_y2": 509.5, "r_x3": 189.2, "r_y3": 509.5, "coord_origin": "TOPLEFT" }, "text": "tokens:", "orig": "tokens:", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 99, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 210.6, "r_y0": 515.3, "r_x1": 221.0, "r_y1": 515.3, "r_x2": 221.0, "r_y2": 509.5, "r_x3": 210.6, "r_y3": 509.5, "coord_origin": "TOPLEFT" }, "text": "258", "orig": "258", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 100, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 390.2, "r_y0": 515.5, "r_x1": 406.8, "r_y1": 515.5, "r_x2": 406.8, "r_y2": 509.6, "r_x3": 390.2, "r_y3": 509.6, "coord_origin": "TOPLEFT" }, "text": "OTSL", "orig": "OTSL", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 101, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 408.6, "r_y0": 515.5, "r_x1": 411.4, "r_y1": 515.5, "r_x2": 411.4, "r_y2": 509.6, "r_x3": 408.6, "r_y3": 509.6, "coord_origin": "TOPLEFT" }, "text": "#", "orig": "#", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 102, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 414.2, "r_y0": 515.5, "r_x1": 433.9, "r_y1": 515.5, "r_x2": 433.9, "r_y2": 509.6, "r_x3": 414.2, "r_y3": 509.6, "coord_origin": "TOPLEFT" }, "text": "tokens:", "orig": "tokens:", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 103, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 435.6, "r_y0": 515.5, "r_x1": 446.0, "r_y1": 515.5, "r_x2": 446.0, "r_y2": 509.6, "r_x3": 435.6, "r_y3": 509.6, "coord_origin": "TOPLEFT" }, "text": "135", "orig": "135", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 104, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 167.2, "r_y0": 526.4, "r_x1": 172.8, "r_y1": 526.4, "r_x2": 172.8, "r_y2": 519.1, "r_x3": 167.2, "r_y3": 519.1, "coord_origin": "TOPLEFT" }, "text": "B", "orig": "B", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 105, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 187.3, "r_y0": 455.9, "r_x1": 193.0, "r_y1": 455.9, "r_x2": 193.0, "r_y2": 448.6, "r_x3": 187.3, "r_y3": 448.6, "coord_origin": "TOPLEFT" }, "text": "A", "orig": "A", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 106, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 167.4, "r_y0": 573.3, "r_x1": 173.0, "r_y1": 573.3, "r_x2": 173.0, "r_y2": 566.0, "r_x3": 167.4, "r_y3": 566.0, "coord_origin": "TOPLEFT" }, "text": "D", "orig": "D", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 107, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 248.5, "r_y0": 629.1, "r_x1": 253.7, "r_y1": 629.1, "r_x2": 253.7, "r_y2": 621.8, "r_x3": 248.5, "r_y3": 621.8, "coord_origin": "TOPLEFT" }, "text": "E", "orig": "E", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 108, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 395.9, "r_y0": 526.5, "r_x1": 401.5, "r_y1": 526.5, "r_x2": 401.5, "r_y2": 519.2, "r_x3": 395.9, "r_y3": 519.2, "coord_origin": "TOPLEFT" }, "text": "C", "orig": "C", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 109, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 171.6, "r_y0": 597.3, "r_x1": 177.5, "r_y1": 597.3, "r_x2": 177.5, "r_y2": 580.3, "r_x3": 171.6, "r_y3": 580.3, "coord_origin": "TOPLEFT" }, "text": "HTML", "orig": "HTML", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 110, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 251.1, "r_y0": 649.9, "r_x1": 256.9, "r_y1": 649.9, "r_x2": 256.9, "r_y2": 633.6, "r_x3": 251.1, "r_y3": 633.6, "coord_origin": "TOPLEFT" }, "text": "OTSL", "orig": "OTSL", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 111, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 372.1, "r_y0": 607.3, "r_x1": 427.0, "r_y1": 607.3, "r_x2": 427.0, "r_y2": 601.5, "r_x3": 372.1, "r_y3": 601.5, "coord_origin": "TOPLEFT" }, "text": "HTML model shows", "orig": "HTML model shows", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 112, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 372.1, "r_y0": 613.8, "r_x1": 430.1, "r_y1": 613.8, "r_x2": 430.1, "r_y2": 607.9, "r_x3": 372.1, "r_y3": 607.9, "coord_origin": "TOPLEFT" }, "text": "bounding box drifting", "orig": "bounding box drifting", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 113, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 176.9, "r_y0": 648.7, "r_x1": 231.1, "r_y1": 648.7, "r_x2": 231.1, "r_y2": 642.9, "r_x3": 176.9, "r_y3": 642.9, "coord_origin": "TOPLEFT" }, "text": "OTSL model shows", "orig": "OTSL model shows", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 114, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 176.9, "r_y0": 655.2, "r_x1": 231.0, "r_y1": 655.2, "r_x2": 231.0, "r_y2": 649.3, "r_x3": 176.9, "r_y3": 649.3, "coord_origin": "TOPLEFT" }, "text": "clean bounding box", "orig": "clean bounding box", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 115, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 176.9, "r_y0": 661.6, "r_x1": 203.9, "r_y1": 661.6, "r_x2": 203.9, "r_y2": 655.8, "r_x3": 176.9, "r_y3": 655.8, "coord_origin": "TOPLEFT" }, "text": "alignment", "orig": "alignment", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 116, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 215.9, "r_y0": 569.2, "r_x1": 218.5, "r_y1": 569.2, "r_x2": 218.5, "r_y2": 557.6, "r_x3": 215.9, "r_y3": 557.6, "coord_origin": "TOPLEFT" }, "text": "\u2264", "orig": "\u2264", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 117, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 229.1, "r_y0": 569.2, "r_x1": 231.7, "r_y1": 569.2, "r_x2": 231.7, "r_y2": 557.6, "r_x3": 229.1, "r_y3": 557.6, "coord_origin": "TOPLEFT" }, "text": "\u03bc", "orig": "\u03bc", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 119, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 261.2, "r_y0": 451.2, "r_x1": 263.6, "r_y1": 451.2, "r_x2": 263.6, "r_y2": 448.5, "r_x3": 261.2, "r_y3": 448.5, "coord_origin": "TOPLEFT" }, "text": "S", "orig": "S", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 120, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 312.3, "r_y0": 451.2, "r_x1": 313.6, "r_y1": 451.2, "r_x2": 313.6, "r_y2": 448.5, "r_x3": 312.3, "r_y3": 448.5, "coord_origin": "TOPLEFT" }, "text": "I", "orig": "I", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 121, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 377.4, "r_y0": 451.2, "r_x1": 380.1, "r_y1": 451.2, "r_x2": 380.1, "r_y2": 448.5, "r_x3": 377.4, "r_y3": 448.5, "coord_origin": "TOPLEFT" }, "text": "R", "orig": "R", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 122, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 200.6, "r_y0": 456.1, "r_x1": 205.8, "r_y1": 456.1, "r_x2": 205.8, "r_y2": 453.3, "r_x3": 200.6, "r_y3": 453.3, "coord_origin": "TOPLEFT" }, "text": "ST", "orig": "ST", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 123, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 222.2, "r_y0": 456.1, "r_x1": 229.8, "r_y1": 456.1, "r_x2": 229.8, "r_y2": 453.3, "r_x3": 222.2, "r_y3": 453.3, "coord_origin": "TOPLEFT" }, "text": "0.03", "orig": "0.03", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 124, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 243.3, "r_y0": 456.1, "r_x1": 250.8, "r_y1": 456.1, "r_x2": 250.8, "r_y2": 453.3, "r_x3": 243.3, "r_y3": 453.3, "coord_origin": "TOPLEFT" }, "text": "0.06", "orig": "0.06", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 125, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 264.3, "r_y0": 456.1, "r_x1": 271.8, "r_y1": 456.1, "r_x2": 271.8, "r_y2": 453.3, "r_x3": 264.3, "r_y3": 453.3, "coord_origin": "TOPLEFT" }, "text": "0.12", "orig": "0.12", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 126, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 285.3, "r_y0": 456.1, "r_x1": 292.9, "r_y1": 456.1, "r_x2": 292.9, "r_y2": 453.3, "r_x3": 285.3, "r_y3": 453.3, "coord_origin": "TOPLEFT" }, "text": "0.25", "orig": "0.25", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 127, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 306.4, "r_y0": 456.1, "r_x1": 311.8, "r_y1": 456.1, "r_x2": 311.8, "r_y2": 453.3, "r_x3": 306.4, "r_y3": 453.3, "coord_origin": "TOPLEFT" }, "text": "0.5", "orig": "0.5", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 128, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 323.4, "r_y0": 456.1, "r_x1": 325.6, "r_y1": 456.1, "r_x2": 325.6, "r_y2": 453.3, "r_x3": 323.4, "r_y3": 453.3, "coord_origin": "TOPLEFT" }, "text": "1", "orig": "1", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 129, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 334.5, "r_y0": 456.1, "r_x1": 336.6, "r_y1": 456.1, "r_x2": 336.6, "r_y2": 453.3, "r_x3": 334.5, "r_y3": 453.3, "coord_origin": "TOPLEFT" }, "text": "2", "orig": "2", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 130, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 345.5, "r_y0": 456.1, "r_x1": 347.7, "r_y1": 456.1, "r_x2": 347.7, "r_y2": 453.3, "r_x3": 345.5, "r_y3": 453.3, "coord_origin": "TOPLEFT" }, "text": "4", "orig": "4", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 131, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 356.6, "r_y0": 456.1, "r_x1": 358.7, "r_y1": 456.1, "r_x2": 358.7, "r_y2": 453.3, "r_x3": 356.6, "r_y3": 453.3, "coord_origin": "TOPLEFT" }, "text": "8", "orig": "8", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 132, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 367.6, "r_y0": 456.1, "r_x1": 372.0, "r_y1": 456.1, "r_x2": 372.0, "r_y2": 453.3, "r_x3": 367.6, "r_y3": 453.3, "coord_origin": "TOPLEFT" }, "text": "16", "orig": "16", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 133, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 382.7, "r_y0": 456.1, "r_x1": 387.0, "r_y1": 456.1, "r_x2": 387.0, "r_y2": 453.3, "r_x3": 382.7, "r_y3": 453.3, "coord_origin": "TOPLEFT" }, "text": "32", "orig": "32", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 134, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 397.7, "r_y0": 456.1, "r_x1": 402.1, "r_y1": 456.1, "r_x2": 402.1, "r_y2": 453.3, "r_x3": 397.7, "r_y3": 453.3, "coord_origin": "TOPLEFT" }, "text": "64", "orig": "64", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 135, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 412.8, "r_y0": 457.8, "r_x1": 414.9, "r_y1": 457.8, "r_x2": 414.9, "r_y2": 448.0, "r_x3": 412.8, "r_y3": 448.0, "coord_origin": "TOPLEFT" }, "text": "\u2265", "orig": "\u2265", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 136, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 415.0, "r_y0": 456.1, "r_x1": 422.5, "r_y1": 456.1, "r_x2": 422.5, "r_y2": 453.3, "r_x3": 415.0, "r_y3": 453.3, "coord_origin": "TOPLEFT" }, "text": " 128", "orig": " 128", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 137, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 200.6, "r_y0": 466.7, "r_x1": 204.6, "r_y1": 466.7, "r_x2": 204.6, "r_y2": 463.9, "r_x3": 200.6, "r_y3": 463.9, "coord_origin": "TOPLEFT" }, "text": "63", "orig": "63", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 138, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 367.6, "r_y0": 466.7, "r_x1": 369.6, "r_y1": 466.7, "r_x2": 369.6, "r_y2": 463.9, "r_x3": 367.6, "r_y3": 463.9, "coord_origin": "TOPLEFT" }, "text": "1", "orig": "1", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 139, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 382.7, "r_y0": 466.7, "r_x1": 384.6, "r_y1": 466.7, "r_x2": 384.6, "r_y2": 463.9, "r_x3": 382.7, "r_y3": 463.9, "coord_origin": "TOPLEFT" }, "text": "1", "orig": "1", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 140, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 397.7, "r_y0": 466.7, "r_x1": 399.7, "r_y1": 466.7, "r_x2": 399.7, "r_y2": 463.9, "r_x3": 397.7, "r_y3": 463.9, "coord_origin": "TOPLEFT" }, "text": "3", "orig": "3", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 141, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 200.6, "r_y0": 471.5, "r_x1": 206.5, "r_y1": 471.5, "r_x2": 206.5, "r_y2": 468.8, "r_x3": 200.6, "r_y3": 468.8, "coord_origin": "TOPLEFT" }, "text": "199", "orig": "199", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 142, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 264.3, "r_y0": 471.5, "r_x1": 266.3, "r_y1": 471.5, "r_x2": 266.3, "r_y2": 468.8, "r_x3": 264.3, "r_y3": 468.8, "coord_origin": "TOPLEFT" }, "text": "5", "orig": "5", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 143, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 306.4, "r_y0": 471.5, "r_x1": 308.3, "r_y1": 471.5, "r_x2": 308.3, "r_y2": 468.8, "r_x3": 306.4, "r_y3": 468.8, "coord_origin": "TOPLEFT" }, "text": "1", "orig": "1", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 144, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 345.5, "r_y0": 471.5, "r_x1": 347.5, "r_y1": 471.5, "r_x2": 347.5, "r_y2": 468.8, "r_x3": 345.5, "r_y3": 468.8, "coord_origin": "TOPLEFT" }, "text": "2", "orig": "2", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 145, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 356.6, "r_y0": 471.5, "r_x1": 358.5, "r_y1": 471.5, "r_x2": 358.5, "r_y2": 468.8, "r_x3": 356.6, "r_y3": 468.8, "coord_origin": "TOPLEFT" }, "text": "4", "orig": "4", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 146, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 367.6, "r_y0": 471.5, "r_x1": 369.6, "r_y1": 471.5, "r_x2": 369.6, "r_y2": 468.8, "r_x3": 367.6, "r_y3": 468.8, "coord_origin": "TOPLEFT" }, "text": "1", "orig": "1", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 147, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 382.7, "r_y0": 471.5, "r_x1": 384.6, "r_y1": 471.5, "r_x2": 384.6, "r_y2": 468.8, "r_x3": 382.7, "r_y3": 468.8, "coord_origin": "TOPLEFT" }, "text": "1", "orig": "1", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 148, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 200.6, "r_y0": 476.4, "r_x1": 206.5, "r_y1": 476.4, "r_x2": 206.5, "r_y2": 473.7, "r_x3": 200.6, "r_y3": 473.7, "coord_origin": "TOPLEFT" }, "text": "416", "orig": "416", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 149, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 264.3, "r_y0": 476.4, "r_x1": 266.3, "r_y1": 476.4, "r_x2": 266.3, "r_y2": 473.7, "r_x3": 264.3, "r_y3": 473.7, "coord_origin": "TOPLEFT" }, "text": "4", "orig": "4", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 150, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 200.6, "r_y0": 481.3, "r_x1": 206.5, "r_y1": 481.3, "r_x2": 206.5, "r_y2": 478.5, "r_x3": 200.6, "r_y3": 478.5, "coord_origin": "TOPLEFT" }, "text": "230", "orig": "230", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 151, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 243.3, "r_y0": 481.3, "r_x1": 245.2, "r_y1": 481.3, "r_x2": 245.2, "r_y2": 478.5, "r_x3": 243.3, "r_y3": 478.5, "coord_origin": "TOPLEFT" }, "text": "1", "orig": "1", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 152, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 264.3, "r_y0": 481.3, "r_x1": 266.3, "r_y1": 481.3, "r_x2": 266.3, "r_y2": 478.5, "r_x3": 264.3, "r_y3": 478.5, "coord_origin": "TOPLEFT" }, "text": "9", "orig": "9", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 153, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 323.4, "r_y0": 481.3, "r_x1": 325.4, "r_y1": 481.3, "r_x2": 325.4, "r_y2": 478.5, "r_x3": 323.4, "r_y3": 478.5, "coord_origin": "TOPLEFT" }, "text": "1", "orig": "1", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 154, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 397.7, "r_y0": 481.3, "r_x1": 399.7, "r_y1": 481.3, "r_x2": 399.7, "r_y2": 478.5, "r_x3": 397.7, "r_y3": 478.5, "coord_origin": "TOPLEFT" }, "text": "1", "orig": "1", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 155, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 200.6, "r_y0": 486.1, "r_x1": 206.5, "r_y1": 486.1, "r_x2": 206.5, "r_y2": 483.4, "r_x3": 200.6, "r_y3": 483.4, "coord_origin": "TOPLEFT" }, "text": "276", "orig": "276", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 156, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 382.7, "r_y0": 486.1, "r_x1": 384.6, "r_y1": 486.1, "r_x2": 384.6, "r_y2": 483.4, "r_x3": 382.7, "r_y3": 483.4, "coord_origin": "TOPLEFT" }, "text": "2", "orig": "2", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 157, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 397.7, "r_y0": 486.1, "r_x1": 401.6, "r_y1": 486.1, "r_x2": 401.6, "r_y2": 483.4, "r_x3": 397.7, "r_y3": 483.4, "coord_origin": "TOPLEFT" }, "text": "12", "orig": "12", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 158, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 412.8, "r_y0": 486.1, "r_x1": 414.7, "r_y1": 486.1, "r_x2": 414.7, "r_y2": 483.4, "r_x3": 412.8, "r_y3": 483.4, "coord_origin": "TOPLEFT" }, "text": "1", "orig": "1", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 159, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 200.6, "r_y0": 491.0, "r_x1": 207.1, "r_y1": 491.0, "r_x2": 207.1, "r_y2": 488.3, "r_x3": 200.6, "r_y3": 488.3, "coord_origin": "TOPLEFT" }, "text": "320", "orig": "320", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 160, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 367.6, "r_y0": 491.0, "r_x1": 369.8, "r_y1": 491.0, "r_x2": 369.8, "r_y2": 488.3, "r_x3": 367.6, "r_y3": 488.3, "coord_origin": "TOPLEFT" }, "text": "1", "orig": "1", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 161, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 382.7, "r_y0": 491.0, "r_x1": 384.8, "r_y1": 491.0, "r_x2": 384.8, "r_y2": 488.3, "r_x3": 382.7, "r_y3": 488.3, "coord_origin": "TOPLEFT" }, "text": "4", "orig": "4", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 162, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 397.7, "r_y0": 491.0, "r_x1": 402.1, "r_y1": 491.0, "r_x2": 402.1, "r_y2": 488.3, "r_x3": 397.7, "r_y3": 488.3, "coord_origin": "TOPLEFT" }, "text": "20", "orig": "20", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 163, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 200.6, "r_y0": 495.9, "r_x1": 208.5, "r_y1": 495.9, "r_x2": 208.5, "r_y2": 493.2, "r_x3": 200.6, "r_y3": 493.2, "coord_origin": "TOPLEFT" }, "text": "2013", "orig": "2013", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 164, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 264.3, "r_y0": 495.9, "r_x1": 266.3, "r_y1": 495.9, "r_x2": 266.3, "r_y2": 493.2, "r_x3": 264.3, "r_y3": 493.2, "coord_origin": "TOPLEFT" }, "text": "3", "orig": "3", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [ { "id": 58, "label": "text", "bbox": { "l": 180.1, "t": 516.2, "r": 190.6, "b": 518.9, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 67, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 180.1, "r_y0": 518.9, "r_x1": 190.6, "r_y1": 518.9, "r_x2": 190.6, "r_y2": 516.2, "r_x3": 180.1, "r_y3": 516.2, "coord_origin": "TOPLEFT" }, "text": "", "orig": "
", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 59, "label": "text", "bbox": { "l": 183.2, "t": 520.1, "r": 304.5, "b": 522.8, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 68, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 183.2, "r_y0": 522.8, "r_x1": 304.5, "r_y1": 522.8, "r_x2": 304.5, "r_y2": 520.1, "r_x3": 183.2, "r_y3": 520.1, "coord_origin": "TOPLEFT" }, "text": "", "orig": "", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 60, "label": "text", "bbox": { "l": 183.2, "t": 524.0, "r": 388.4, "b": 526.7, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 69, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 183.2, "r_y0": 526.7, "r_x1": 388.4, "r_y1": 526.7, "r_x2": 388.4, "r_y2": 524.0, "r_x3": 183.2, "r_y3": 524.0, "coord_origin": "TOPLEFT" }, "text": "", "orig": "", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 61, "label": "text", "bbox": { "l": 183.2, "t": 527.9, "r": 388.4, "b": 530.6, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 70, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 183.2, "r_y0": 530.6, "r_x1": 388.4, "r_y1": 530.6, "r_x2": 388.4, "r_y2": 527.9, "r_x3": 183.2, "r_y3": 527.9, "coord_origin": "TOPLEFT" }, "text": "", "orig": "", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 62, "label": "text", "bbox": { "l": 183.2, "t": 531.8, "r": 388.4, "b": 534.5, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 71, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 183.2, "r_y0": 534.5, "r_x1": 388.4, "r_y1": 534.5, "r_x2": 388.4, "r_y2": 531.8, "r_x3": 183.2, "r_y3": 531.8, "coord_origin": "TOPLEFT" }, "text": "", "orig": "", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 63, "label": "text", "bbox": { "l": 183.2, "t": 535.7, "r": 388.4, "b": 538.4, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 72, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 183.2, "r_y0": 538.4, "r_x1": 388.4, "r_y1": 538.4, "r_x2": 388.4, "r_y2": 535.7, "r_x3": 183.2, "r_y3": 535.7, "coord_origin": "TOPLEFT" }, "text": "", "orig": "", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 64, "label": "text", "bbox": { "l": 183.2, "t": 539.6, "r": 388.4, "b": 542.3, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 73, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 183.2, "r_y0": 542.3, "r_x1": 388.4, "r_y1": 542.3, "r_x2": 388.4, "r_y2": 539.6, "r_x3": 183.2, "r_y3": 539.6, "coord_origin": "TOPLEFT" }, "text": "", "orig": "", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 65, "label": "text", "bbox": { "l": 183.2, "t": 543.5, "r": 388.4, "b": 546.2, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 74, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 183.2, "r_y0": 546.2, "r_x1": 388.4, "r_y1": 546.2, "r_x2": 388.4, "r_y2": 543.5, "r_x3": 183.2, "r_y3": 543.5, "coord_origin": "TOPLEFT" }, "text": "", "orig": "", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 66, "label": "text", "bbox": { "l": 183.2, "t": 547.4, "r": 388.4, "b": 550.1, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 75, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 183.2, "r_y0": 550.1, "r_x1": 388.4, "r_y1": 550.1, "r_x2": 388.4, "r_y2": 547.4, "r_x3": 183.2, "r_y3": 547.4, "coord_origin": "TOPLEFT" }, "text": "", "orig": "", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 67, "label": "text", "bbox": { "l": 183.2, "t": 551.3, "r": 388.4, "b": 554.0, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 76, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 183.2, "r_y0": 554.0, "r_x1": 388.4, "r_y1": 554.0, "r_x2": 388.4, "r_y2": 551.3, "r_x3": 183.2, "r_y3": 551.3, "coord_origin": "TOPLEFT" }, "text": "", "orig": "", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 68, "label": "text", "bbox": { "l": 180.1, "t": 555.2, "r": 191.9, "b": 557.9, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 77, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 180.1, "r_y0": 557.9, "r_x1": 191.9, "r_y1": 557.9, "r_x2": 191.9, "r_y2": 555.2, "r_x3": 180.1, "r_y3": 555.2, "coord_origin": "TOPLEFT" }, "text": "
", "orig": "", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 69, "label": "text", "bbox": { "l": 407.4, "t": 518.3, "r": 408.8, "b": 521.0, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 78, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 407.4, "r_y0": 521.0, "r_x1": 408.8, "r_y1": 521.0, "r_x2": 408.8, "r_y2": 518.3, "r_x3": 407.4, "r_y3": 518.3, "coord_origin": "TOPLEFT" }, "text": "C", "orig": "C", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 70, "label": "text", "bbox": { "l": 410.3, "t": 518.3, "r": 450.5, "b": 521.0, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 79, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 410.3, "r_y0": 521.0, "r_x1": 450.5, "r_y1": 521.0, "r_x2": 450.5, "r_y2": 518.3, "r_x3": 410.3, "r_y3": 518.3, "coord_origin": "TOPLEFT" }, "text": "C L L L C L L L L L C L L NL", "orig": "C L L L C L L L L L C L L NL", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 71, "label": "text", "bbox": { "l": 407.4, "t": 522.2, "r": 408.8, "b": 524.9, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 80, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 407.4, "r_y0": 524.9, "r_x1": 408.8, "r_y1": 524.9, "r_x2": 408.8, "r_y2": 522.2, "r_x3": 407.4, "r_y3": 522.2, "coord_origin": "TOPLEFT" }, "text": "C", "orig": "C", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 72, "label": "text", "bbox": { "l": 410.3, "t": 522.2, "r": 450.5, "b": 524.9, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 81, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 410.3, "r_y0": 524.9, "r_x1": 450.5, "r_y1": 524.9, "r_x2": 450.5, "r_y2": 522.2, "r_x3": 410.3, "r_y3": 522.2, "coord_origin": "TOPLEFT" }, "text": "C C C C C C C C C C C C C NL", "orig": "C C C C C C C C C C C C C NL", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 73, "label": "text", "bbox": { "l": 407.4, "t": 526.1, "r": 408.8, "b": 528.8, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 82, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 407.4, "r_y0": 528.8, "r_x1": 408.8, "r_y1": 528.8, "r_x2": 408.8, "r_y2": 526.1, "r_x3": 407.4, "r_y3": 526.1, "coord_origin": "TOPLEFT" }, "text": "C", "orig": "C", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 74, "label": "text", "bbox": { "l": 410.3, "t": 526.1, "r": 450.5, "b": 528.8, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 83, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 410.3, "r_y0": 528.8, "r_x1": 450.5, "r_y1": 528.8, "r_x2": 450.5, "r_y2": 526.1, "r_x3": 410.3, "r_y3": 526.1, "coord_origin": "TOPLEFT" }, "text": "C C C C C C C C C C C C C NL", "orig": "C C C C C C C C C C C C C NL", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 75, "label": "text", "bbox": { "l": 407.4, "t": 530.0, "r": 408.8, "b": 532.7, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 84, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 407.4, "r_y0": 532.7, "r_x1": 408.8, "r_y1": 532.7, "r_x2": 408.8, "r_y2": 530.0, "r_x3": 407.4, "r_y3": 530.0, "coord_origin": "TOPLEFT" }, "text": "C", "orig": "C", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 76, "label": "text", "bbox": { "l": 410.3, "t": 530.0, "r": 450.5, "b": 532.7, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 85, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 410.3, "r_y0": 532.7, "r_x1": 450.5, "r_y1": 532.7, "r_x2": 450.5, "r_y2": 530.0, "r_x3": 410.3, "r_y3": 530.0, "coord_origin": "TOPLEFT" }, "text": "C C C C C C C C C C C C C NL", "orig": "C C C C C C C C C C C C C NL", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 77, "label": "text", "bbox": { "l": 407.4, "t": 533.9, "r": 408.8, "b": 536.6, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 86, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 407.4, "r_y0": 536.6, "r_x1": 408.8, "r_y1": 536.6, "r_x2": 408.8, "r_y2": 533.9, "r_x3": 407.4, "r_y3": 533.9, "coord_origin": "TOPLEFT" }, "text": "C", "orig": "C", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 78, "label": "text", "bbox": { "l": 410.3, "t": 533.9, "r": 450.5, "b": 536.6, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 87, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 410.3, "r_y0": 536.6, "r_x1": 450.5, "r_y1": 536.6, "r_x2": 450.5, "r_y2": 533.9, "r_x3": 410.3, "r_y3": 533.9, "coord_origin": "TOPLEFT" }, "text": "C C C C C C C C C C C C C NL", "orig": "C C C C C C C C C C C C C NL", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 79, "label": "text", "bbox": { "l": 407.4, "t": 537.8, "r": 408.8, "b": 540.5, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 88, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 407.4, "r_y0": 540.5, "r_x1": 408.8, "r_y1": 540.5, "r_x2": 408.8, "r_y2": 537.8, "r_x3": 407.4, "r_y3": 537.8, "coord_origin": "TOPLEFT" }, "text": "C", "orig": "C", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 80, "label": "text", "bbox": { "l": 410.3, "t": 537.8, "r": 450.5, "b": 540.5, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 89, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 410.3, "r_y0": 540.5, "r_x1": 450.5, "r_y1": 540.5, "r_x2": 450.5, "r_y2": 537.8, "r_x3": 410.3, "r_y3": 537.8, "coord_origin": "TOPLEFT" }, "text": "C C C C C C C C C C C C C NL", "orig": "C C C C C C C C C C C C C NL", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 81, "label": "text", "bbox": { "l": 407.4, "t": 541.7, "r": 408.8, "b": 544.4, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 90, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 407.4, "r_y0": 544.4, "r_x1": 408.8, "r_y1": 544.4, "r_x2": 408.8, "r_y2": 541.7, "r_x3": 407.4, "r_y3": 541.7, "coord_origin": "TOPLEFT" }, "text": "C", "orig": "C", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 82, "label": "text", "bbox": { "l": 410.3, "t": 541.7, "r": 450.5, "b": 544.4, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 91, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 410.3, "r_y0": 544.4, "r_x1": 450.5, "r_y1": 544.4, "r_x2": 450.5, "r_y2": 541.7, "r_x3": 410.3, "r_y3": 541.7, "coord_origin": "TOPLEFT" }, "text": "C C C C C C C C C C C C C NL", "orig": "C C C C C C C C C C C C C NL", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 83, "label": "text", "bbox": { "l": 407.4, "t": 545.6, "r": 408.8, "b": 548.3, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 92, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 407.4, "r_y0": 548.3, "r_x1": 408.8, "r_y1": 548.3, "r_x2": 408.8, "r_y2": 545.6, "r_x3": 407.4, "r_y3": 545.6, "coord_origin": "TOPLEFT" }, "text": "C", "orig": "C", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 84, "label": "text", "bbox": { "l": 410.3, "t": 545.6, "r": 450.5, "b": 548.3, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 93, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 410.3, "r_y0": 548.3, "r_x1": 450.5, "r_y1": 548.3, "r_x2": 450.5, "r_y2": 545.6, "r_x3": 410.3, "r_y3": 545.6, "coord_origin": "TOPLEFT" }, "text": "C C C C C C C C C C C C C NL", "orig": "C C C C C C C C C C C C C NL", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 85, "label": "text", "bbox": { "l": 407.4, "t": 549.5, "r": 408.8, "b": 552.2, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 94, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 407.4, "r_y0": 552.2, "r_x1": 408.8, "r_y1": 552.2, "r_x2": 408.8, "r_y2": 549.5, "r_x3": 407.4, "r_y3": 549.5, "coord_origin": "TOPLEFT" }, "text": "C", "orig": "C", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 86, "label": "text", "bbox": { "l": 410.3, "t": 549.5, "r": 450.5, "b": 552.2, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 95, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 410.3, "r_y0": 552.2, "r_x1": 450.5, "r_y1": 552.2, "r_x2": 450.5, "r_y2": 549.5, "r_x3": 410.3, "r_y3": 549.5, "coord_origin": "TOPLEFT" }, "text": "C C C C C C C C C C C C C NL", "orig": "C C C C C C C C C C C C C NL", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 87, "label": "text", "bbox": { "l": 164.5, "t": 509.5, "r": 181.9, "b": 515.3, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 96, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 164.5, "r_y0": 515.3, "r_x1": 181.9, "r_y1": 515.3, "r_x2": 181.9, "r_y2": 509.5, "r_x3": 164.5, "r_y3": 509.5, "coord_origin": "TOPLEFT" }, "text": "HTML", "orig": "HTML", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 88, "label": "text", "bbox": { "l": 183.6, "t": 509.5, "r": 186.4, "b": 515.3, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 97, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 183.6, "r_y0": 515.3, "r_x1": 186.4, "r_y1": 515.3, "r_x2": 186.4, "r_y2": 509.5, "r_x3": 183.6, "r_y3": 509.5, "coord_origin": "TOPLEFT" }, "text": "#", "orig": "#", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 89, "label": "text", "bbox": { "l": 189.2, "t": 509.5, "r": 208.9, "b": 515.3, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 98, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 189.2, "r_y0": 515.3, "r_x1": 208.9, "r_y1": 515.3, "r_x2": 208.9, "r_y2": 509.5, "r_x3": 189.2, "r_y3": 509.5, "coord_origin": "TOPLEFT" }, "text": "tokens:", "orig": "tokens:", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 90, "label": "text", "bbox": { "l": 210.6, "t": 509.5, "r": 221.0, "b": 515.3, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 99, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 210.6, "r_y0": 515.3, "r_x1": 221.0, "r_y1": 515.3, "r_x2": 221.0, "r_y2": 509.5, "r_x3": 210.6, "r_y3": 509.5, "coord_origin": "TOPLEFT" }, "text": "258", "orig": "258", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 91, "label": "text", "bbox": { "l": 390.2, "t": 509.6, "r": 406.8, "b": 515.5, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 100, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 390.2, "r_y0": 515.5, "r_x1": 406.8, "r_y1": 515.5, "r_x2": 406.8, "r_y2": 509.6, "r_x3": 390.2, "r_y3": 509.6, "coord_origin": "TOPLEFT" }, "text": "OTSL", "orig": "OTSL", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 92, "label": "text", "bbox": { "l": 408.6, "t": 509.6, "r": 411.4, "b": 515.5, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 101, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 408.6, "r_y0": 515.5, "r_x1": 411.4, "r_y1": 515.5, "r_x2": 411.4, "r_y2": 509.6, "r_x3": 408.6, "r_y3": 509.6, "coord_origin": "TOPLEFT" }, "text": "#", "orig": "#", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 93, "label": "text", "bbox": { "l": 414.2, "t": 509.6, "r": 433.9, "b": 515.5, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 102, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 414.2, "r_y0": 515.5, "r_x1": 433.9, "r_y1": 515.5, "r_x2": 433.9, "r_y2": 509.6, "r_x3": 414.2, "r_y3": 509.6, "coord_origin": "TOPLEFT" }, "text": "tokens:", "orig": "tokens:", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 94, "label": "text", "bbox": { "l": 435.6, "t": 509.6, "r": 446.0, "b": 515.5, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 103, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 435.6, "r_y0": 515.5, "r_x1": 446.0, "r_y1": 515.5, "r_x2": 446.0, "r_y2": 509.6, "r_x3": 435.6, "r_y3": 509.6, "coord_origin": "TOPLEFT" }, "text": "135", "orig": "135", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 95, "label": "text", "bbox": { "l": 167.2, "t": 519.1, "r": 172.8, "b": 526.4, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 104, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 167.2, "r_y0": 526.4, "r_x1": 172.8, "r_y1": 526.4, "r_x2": 172.8, "r_y2": 519.1, "r_x3": 167.2, "r_y3": 519.1, "coord_origin": "TOPLEFT" }, "text": "B", "orig": "B", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 96, "label": "text", "bbox": { "l": 187.3, "t": 448.6, "r": 193.0, "b": 455.9, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 105, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 187.3, "r_y0": 455.9, "r_x1": 193.0, "r_y1": 455.9, "r_x2": 193.0, "r_y2": 448.6, "r_x3": 187.3, "r_y3": 448.6, "coord_origin": "TOPLEFT" }, "text": "A", "orig": "A", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 97, "label": "text", "bbox": { "l": 167.4, "t": 566.0, "r": 173.0, "b": 573.3, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 106, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 167.4, "r_y0": 573.3, "r_x1": 173.0, "r_y1": 573.3, "r_x2": 173.0, "r_y2": 566.0, "r_x3": 167.4, "r_y3": 566.0, "coord_origin": "TOPLEFT" }, "text": "D", "orig": "D", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 98, "label": "text", "bbox": { "l": 248.5, "t": 621.8, "r": 253.7, "b": 629.1, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 107, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 248.5, "r_y0": 629.1, "r_x1": 253.7, "r_y1": 629.1, "r_x2": 253.7, "r_y2": 621.8, "r_x3": 248.5, "r_y3": 621.8, "coord_origin": "TOPLEFT" }, "text": "E", "orig": "E", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 99, "label": "text", "bbox": { "l": 395.9, "t": 519.2, "r": 401.5, "b": 526.5, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 108, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 395.9, "r_y0": 526.5, "r_x1": 401.5, "r_y1": 526.5, "r_x2": 401.5, "r_y2": 519.2, "r_x3": 395.9, "r_y3": 519.2, "coord_origin": "TOPLEFT" }, "text": "C", "orig": "C", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 100, "label": "text", "bbox": { "l": 171.6, "t": 580.3, "r": 177.5, "b": 597.3, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 109, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 171.6, "r_y0": 597.3, "r_x1": 177.5, "r_y1": 597.3, "r_x2": 177.5, "r_y2": 580.3, "r_x3": 171.6, "r_y3": 580.3, "coord_origin": "TOPLEFT" }, "text": "HTML", "orig": "HTML", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 101, "label": "text", "bbox": { "l": 251.1, "t": 633.6, "r": 256.9, "b": 649.9, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 110, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 251.1, "r_y0": 649.9, "r_x1": 256.9, "r_y1": 649.9, "r_x2": 256.9, "r_y2": 633.6, "r_x3": 251.1, "r_y3": 633.6, "coord_origin": "TOPLEFT" }, "text": "OTSL", "orig": "OTSL", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 102, "label": "text", "bbox": { "l": 372.1, "t": 601.5, "r": 427.0, "b": 607.3, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 111, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 372.1, "r_y0": 607.3, "r_x1": 427.0, "r_y1": 607.3, "r_x2": 427.0, "r_y2": 601.5, "r_x3": 372.1, "r_y3": 601.5, "coord_origin": "TOPLEFT" }, "text": "HTML model shows", "orig": "HTML model shows", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 103, "label": "text", "bbox": { "l": 372.1, "t": 607.9, "r": 430.1, "b": 613.8, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 112, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 372.1, "r_y0": 613.8, "r_x1": 430.1, "r_y1": 613.8, "r_x2": 430.1, "r_y2": 607.9, "r_x3": 372.1, "r_y3": 607.9, "coord_origin": "TOPLEFT" }, "text": "bounding box drifting", "orig": "bounding box drifting", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 104, "label": "text", "bbox": { "l": 176.9, "t": 642.9, "r": 231.1, "b": 648.7, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 113, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 176.9, "r_y0": 648.7, "r_x1": 231.1, "r_y1": 648.7, "r_x2": 231.1, "r_y2": 642.9, "r_x3": 176.9, "r_y3": 642.9, "coord_origin": "TOPLEFT" }, "text": "OTSL model shows", "orig": "OTSL model shows", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 105, "label": "text", "bbox": { "l": 176.9, "t": 649.3, "r": 231.0, "b": 655.2, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 114, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 176.9, "r_y0": 655.2, "r_x1": 231.0, "r_y1": 655.2, "r_x2": 231.0, "r_y2": 649.3, "r_x3": 176.9, "r_y3": 649.3, "coord_origin": "TOPLEFT" }, "text": "clean bounding box", "orig": "clean bounding box", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 106, "label": "text", "bbox": { "l": 176.9, "t": 655.8, "r": 203.9, "b": 661.6, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 115, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 176.9, "r_y0": 661.6, "r_x1": 203.9, "r_y1": 661.6, "r_x2": 203.9, "r_y2": 655.8, "r_x3": 176.9, "r_y3": 655.8, "coord_origin": "TOPLEFT" }, "text": "alignment", "orig": "alignment", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 107, "label": "text", "bbox": { "l": 215.9, "t": 557.6, "r": 218.5, "b": 569.2, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 116, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 215.9, "r_y0": 569.2, "r_x1": 218.5, "r_y1": 569.2, "r_x2": 218.5, "r_y2": 557.6, "r_x3": 215.9, "r_y3": 557.6, "coord_origin": "TOPLEFT" }, "text": "\u2264", "orig": "\u2264", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 108, "label": "text", "bbox": { "l": 229.1, "t": 557.6, "r": 231.7, "b": 569.2, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 117, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 229.1, "r_y0": 569.2, "r_x1": 231.7, "r_y1": 569.2, "r_x2": 231.7, "r_y2": 557.6, "r_x3": 229.1, "r_y3": 557.6, "coord_origin": "TOPLEFT" }, "text": "\u03bc", "orig": "\u03bc", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 109, "label": "text", "bbox": { "l": 261.2, "t": 448.5, "r": 263.6, "b": 451.2, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 119, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 261.2, "r_y0": 451.2, "r_x1": 263.6, "r_y1": 451.2, "r_x2": 263.6, "r_y2": 448.5, "r_x3": 261.2, "r_y3": 448.5, "coord_origin": "TOPLEFT" }, "text": "S", "orig": "S", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 110, "label": "text", "bbox": { "l": 312.3, "t": 448.5, "r": 313.6, "b": 451.2, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 120, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 312.3, "r_y0": 451.2, "r_x1": 313.6, "r_y1": 451.2, "r_x2": 313.6, "r_y2": 448.5, "r_x3": 312.3, "r_y3": 448.5, "coord_origin": "TOPLEFT" }, "text": "I", "orig": "I", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 111, "label": "text", "bbox": { "l": 377.4, "t": 448.5, "r": 380.1, "b": 451.2, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 121, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 377.4, "r_y0": 451.2, "r_x1": 380.1, "r_y1": 451.2, "r_x2": 380.1, "r_y2": 448.5, "r_x3": 377.4, "r_y3": 448.5, "coord_origin": "TOPLEFT" }, "text": "R", "orig": "R", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 112, "label": "text", "bbox": { "l": 200.6, "t": 453.3, "r": 205.8, "b": 456.1, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 122, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 200.6, "r_y0": 456.1, "r_x1": 205.8, "r_y1": 456.1, "r_x2": 205.8, "r_y2": 453.3, "r_x3": 200.6, "r_y3": 453.3, "coord_origin": "TOPLEFT" }, "text": "ST", "orig": "ST", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 113, "label": "text", "bbox": { "l": 222.2, "t": 453.3, "r": 229.8, "b": 456.1, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 123, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 222.2, "r_y0": 456.1, "r_x1": 229.8, "r_y1": 456.1, "r_x2": 229.8, "r_y2": 453.3, "r_x3": 222.2, "r_y3": 453.3, "coord_origin": "TOPLEFT" }, "text": "0.03", "orig": "0.03", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 114, "label": "text", "bbox": { "l": 243.3, "t": 453.3, "r": 250.8, "b": 456.1, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 124, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 243.3, "r_y0": 456.1, "r_x1": 250.8, "r_y1": 456.1, "r_x2": 250.8, "r_y2": 453.3, "r_x3": 243.3, "r_y3": 453.3, "coord_origin": "TOPLEFT" }, "text": "0.06", "orig": "0.06", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 115, "label": "text", "bbox": { "l": 264.3, "t": 453.3, "r": 271.8, "b": 456.1, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 125, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 264.3, "r_y0": 456.1, "r_x1": 271.8, "r_y1": 456.1, "r_x2": 271.8, "r_y2": 453.3, "r_x3": 264.3, "r_y3": 453.3, "coord_origin": "TOPLEFT" }, "text": "0.12", "orig": "0.12", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 116, "label": "text", "bbox": { "l": 285.3, "t": 453.3, "r": 292.9, "b": 456.1, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 126, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 285.3, "r_y0": 456.1, "r_x1": 292.9, "r_y1": 456.1, "r_x2": 292.9, "r_y2": 453.3, "r_x3": 285.3, "r_y3": 453.3, "coord_origin": "TOPLEFT" }, "text": "0.25", "orig": "0.25", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 117, "label": "text", "bbox": { "l": 306.4, "t": 453.3, "r": 311.8, "b": 456.1, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 127, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 306.4, "r_y0": 456.1, "r_x1": 311.8, "r_y1": 456.1, "r_x2": 311.8, "r_y2": 453.3, "r_x3": 306.4, "r_y3": 453.3, "coord_origin": "TOPLEFT" }, "text": "0.5", "orig": "0.5", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 118, "label": "text", "bbox": { "l": 323.4, "t": 453.3, "r": 325.6, "b": 456.1, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 128, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 323.4, "r_y0": 456.1, "r_x1": 325.6, "r_y1": 456.1, "r_x2": 325.6, "r_y2": 453.3, "r_x3": 323.4, "r_y3": 453.3, "coord_origin": "TOPLEFT" }, "text": "1", "orig": "1", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 119, "label": "text", "bbox": { "l": 334.5, "t": 453.3, "r": 336.6, "b": 456.1, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 129, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 334.5, "r_y0": 456.1, "r_x1": 336.6, "r_y1": 456.1, "r_x2": 336.6, "r_y2": 453.3, "r_x3": 334.5, "r_y3": 453.3, "coord_origin": "TOPLEFT" }, "text": "2", "orig": "2", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 120, "label": "text", "bbox": { "l": 345.5, "t": 453.3, "r": 347.7, "b": 456.1, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 130, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 345.5, "r_y0": 456.1, "r_x1": 347.7, "r_y1": 456.1, "r_x2": 347.7, "r_y2": 453.3, "r_x3": 345.5, "r_y3": 453.3, "coord_origin": "TOPLEFT" }, "text": "4", "orig": "4", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 121, "label": "text", "bbox": { "l": 356.6, "t": 453.3, "r": 358.7, "b": 456.1, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 131, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 356.6, "r_y0": 456.1, "r_x1": 358.7, "r_y1": 456.1, "r_x2": 358.7, "r_y2": 453.3, "r_x3": 356.6, "r_y3": 453.3, "coord_origin": "TOPLEFT" }, "text": "8", "orig": "8", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 122, "label": "text", "bbox": { "l": 367.6, "t": 453.3, "r": 372.0, "b": 456.1, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 132, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 367.6, "r_y0": 456.1, "r_x1": 372.0, "r_y1": 456.1, "r_x2": 372.0, "r_y2": 453.3, "r_x3": 367.6, "r_y3": 453.3, "coord_origin": "TOPLEFT" }, "text": "16", "orig": "16", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 123, "label": "text", "bbox": { "l": 382.7, "t": 453.3, "r": 387.0, "b": 456.1, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 133, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 382.7, "r_y0": 456.1, "r_x1": 387.0, "r_y1": 456.1, "r_x2": 387.0, "r_y2": 453.3, "r_x3": 382.7, "r_y3": 453.3, "coord_origin": "TOPLEFT" }, "text": "32", "orig": "32", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 124, "label": "text", "bbox": { "l": 397.7, "t": 453.3, "r": 402.1, "b": 456.1, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 134, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 397.7, "r_y0": 456.1, "r_x1": 402.1, "r_y1": 456.1, "r_x2": 402.1, "r_y2": 453.3, "r_x3": 397.7, "r_y3": 453.3, "coord_origin": "TOPLEFT" }, "text": "64", "orig": "64", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 125, "label": "text", "bbox": { "l": 412.8, "t": 448.0, "r": 414.9, "b": 457.8, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 135, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 412.8, "r_y0": 457.8, "r_x1": 414.9, "r_y1": 457.8, "r_x2": 414.9, "r_y2": 448.0, "r_x3": 412.8, "r_y3": 448.0, "coord_origin": "TOPLEFT" }, "text": "\u2265", "orig": "\u2265", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 126, "label": "text", "bbox": { "l": 415.0, "t": 453.3, "r": 422.5, "b": 456.1, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 136, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 415.0, "r_y0": 456.1, "r_x1": 422.5, "r_y1": 456.1, "r_x2": 422.5, "r_y2": 453.3, "r_x3": 415.0, "r_y3": 453.3, "coord_origin": "TOPLEFT" }, "text": " 128", "orig": " 128", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 127, "label": "text", "bbox": { "l": 200.6, "t": 463.9, "r": 204.6, "b": 466.7, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 137, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 200.6, "r_y0": 466.7, "r_x1": 204.6, "r_y1": 466.7, "r_x2": 204.6, "r_y2": 463.9, "r_x3": 200.6, "r_y3": 463.9, "coord_origin": "TOPLEFT" }, "text": "63", "orig": "63", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 128, "label": "text", "bbox": { "l": 367.6, "t": 463.9, "r": 369.6, "b": 466.7, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 138, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 367.6, "r_y0": 466.7, "r_x1": 369.6, "r_y1": 466.7, "r_x2": 369.6, "r_y2": 463.9, "r_x3": 367.6, "r_y3": 463.9, "coord_origin": "TOPLEFT" }, "text": "1", "orig": "1", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 129, "label": "text", "bbox": { "l": 382.7, "t": 463.9, "r": 384.6, "b": 466.7, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 139, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 382.7, "r_y0": 466.7, "r_x1": 384.6, "r_y1": 466.7, "r_x2": 384.6, "r_y2": 463.9, "r_x3": 382.7, "r_y3": 463.9, "coord_origin": "TOPLEFT" }, "text": "1", "orig": "1", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 130, "label": "text", "bbox": { "l": 397.7, "t": 463.9, "r": 399.7, "b": 466.7, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 140, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 397.7, "r_y0": 466.7, "r_x1": 399.7, "r_y1": 466.7, "r_x2": 399.7, "r_y2": 463.9, "r_x3": 397.7, "r_y3": 463.9, "coord_origin": "TOPLEFT" }, "text": "3", "orig": "3", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 131, "label": "text", "bbox": { "l": 200.6, "t": 468.8, "r": 206.5, "b": 471.5, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 141, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 200.6, "r_y0": 471.5, "r_x1": 206.5, "r_y1": 471.5, "r_x2": 206.5, "r_y2": 468.8, "r_x3": 200.6, "r_y3": 468.8, "coord_origin": "TOPLEFT" }, "text": "199", "orig": "199", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 132, "label": "text", "bbox": { "l": 264.3, "t": 468.8, "r": 266.3, "b": 471.5, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 142, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 264.3, "r_y0": 471.5, "r_x1": 266.3, "r_y1": 471.5, "r_x2": 266.3, "r_y2": 468.8, "r_x3": 264.3, "r_y3": 468.8, "coord_origin": "TOPLEFT" }, "text": "5", "orig": "5", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 133, "label": "text", "bbox": { "l": 306.4, "t": 468.8, "r": 308.3, "b": 471.5, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 143, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 306.4, "r_y0": 471.5, "r_x1": 308.3, "r_y1": 471.5, "r_x2": 308.3, "r_y2": 468.8, "r_x3": 306.4, "r_y3": 468.8, "coord_origin": "TOPLEFT" }, "text": "1", "orig": "1", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 134, "label": "text", "bbox": { "l": 345.5, "t": 468.8, "r": 347.5, "b": 471.5, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 144, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 345.5, "r_y0": 471.5, "r_x1": 347.5, "r_y1": 471.5, "r_x2": 347.5, "r_y2": 468.8, "r_x3": 345.5, "r_y3": 468.8, "coord_origin": "TOPLEFT" }, "text": "2", "orig": "2", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 135, "label": "text", "bbox": { "l": 356.6, "t": 468.8, "r": 358.5, "b": 471.5, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 145, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 356.6, "r_y0": 471.5, "r_x1": 358.5, "r_y1": 471.5, "r_x2": 358.5, "r_y2": 468.8, "r_x3": 356.6, "r_y3": 468.8, "coord_origin": "TOPLEFT" }, "text": "4", "orig": "4", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 136, "label": "text", "bbox": { "l": 367.6, "t": 468.8, "r": 369.6, "b": 471.5, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 146, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 367.6, "r_y0": 471.5, "r_x1": 369.6, "r_y1": 471.5, "r_x2": 369.6, "r_y2": 468.8, "r_x3": 367.6, "r_y3": 468.8, "coord_origin": "TOPLEFT" }, "text": "1", "orig": "1", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 137, "label": "text", "bbox": { "l": 382.7, "t": 468.8, "r": 384.6, "b": 471.5, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 147, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 382.7, "r_y0": 471.5, "r_x1": 384.6, "r_y1": 471.5, "r_x2": 384.6, "r_y2": 468.8, "r_x3": 382.7, "r_y3": 468.8, "coord_origin": "TOPLEFT" }, "text": "1", "orig": "1", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 138, "label": "text", "bbox": { "l": 200.6, "t": 473.7, "r": 206.5, "b": 476.4, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 148, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 200.6, "r_y0": 476.4, "r_x1": 206.5, "r_y1": 476.4, "r_x2": 206.5, "r_y2": 473.7, "r_x3": 200.6, "r_y3": 473.7, "coord_origin": "TOPLEFT" }, "text": "416", "orig": "416", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 139, "label": "text", "bbox": { "l": 264.3, "t": 473.7, "r": 266.3, "b": 476.4, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 149, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 264.3, "r_y0": 476.4, "r_x1": 266.3, "r_y1": 476.4, "r_x2": 266.3, "r_y2": 473.7, "r_x3": 264.3, "r_y3": 473.7, "coord_origin": "TOPLEFT" }, "text": "4", "orig": "4", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 140, "label": "text", "bbox": { "l": 200.6, "t": 478.5, "r": 206.5, "b": 481.3, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 150, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 200.6, "r_y0": 481.3, "r_x1": 206.5, "r_y1": 481.3, "r_x2": 206.5, "r_y2": 478.5, "r_x3": 200.6, "r_y3": 478.5, "coord_origin": "TOPLEFT" }, "text": "230", "orig": "230", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 141, "label": "text", "bbox": { "l": 243.3, "t": 478.5, "r": 245.2, "b": 481.3, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 151, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 243.3, "r_y0": 481.3, "r_x1": 245.2, "r_y1": 481.3, "r_x2": 245.2, "r_y2": 478.5, "r_x3": 243.3, "r_y3": 478.5, "coord_origin": "TOPLEFT" }, "text": "1", "orig": "1", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 142, "label": "text", "bbox": { "l": 264.3, "t": 478.5, "r": 266.3, "b": 481.3, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 152, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 264.3, "r_y0": 481.3, "r_x1": 266.3, "r_y1": 481.3, "r_x2": 266.3, "r_y2": 478.5, "r_x3": 264.3, "r_y3": 478.5, "coord_origin": "TOPLEFT" }, "text": "9", "orig": "9", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 143, "label": "text", "bbox": { "l": 323.4, "t": 478.5, "r": 325.4, "b": 481.3, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 153, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 323.4, "r_y0": 481.3, "r_x1": 325.4, "r_y1": 481.3, "r_x2": 325.4, "r_y2": 478.5, "r_x3": 323.4, "r_y3": 478.5, "coord_origin": "TOPLEFT" }, "text": "1", "orig": "1", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 144, "label": "text", "bbox": { "l": 397.7, "t": 478.5, "r": 399.7, "b": 481.3, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 154, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 397.7, "r_y0": 481.3, "r_x1": 399.7, "r_y1": 481.3, "r_x2": 399.7, "r_y2": 478.5, "r_x3": 397.7, "r_y3": 478.5, "coord_origin": "TOPLEFT" }, "text": "1", "orig": "1", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 145, "label": "text", "bbox": { "l": 200.6, "t": 483.4, "r": 206.5, "b": 486.1, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 155, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 200.6, "r_y0": 486.1, "r_x1": 206.5, "r_y1": 486.1, "r_x2": 206.5, "r_y2": 483.4, "r_x3": 200.6, "r_y3": 483.4, "coord_origin": "TOPLEFT" }, "text": "276", "orig": "276", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 146, "label": "text", "bbox": { "l": 382.7, "t": 483.4, "r": 384.6, "b": 486.1, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 156, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 382.7, "r_y0": 486.1, "r_x1": 384.6, "r_y1": 486.1, "r_x2": 384.6, "r_y2": 483.4, "r_x3": 382.7, "r_y3": 483.4, "coord_origin": "TOPLEFT" }, "text": "2", "orig": "2", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 147, "label": "text", "bbox": { "l": 397.7, "t": 483.4, "r": 401.6, "b": 486.1, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 157, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 397.7, "r_y0": 486.1, "r_x1": 401.6, "r_y1": 486.1, "r_x2": 401.6, "r_y2": 483.4, "r_x3": 397.7, "r_y3": 483.4, "coord_origin": "TOPLEFT" }, "text": "12", "orig": "12", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 148, "label": "text", "bbox": { "l": 412.8, "t": 483.4, "r": 414.7, "b": 486.1, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 158, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 412.8, "r_y0": 486.1, "r_x1": 414.7, "r_y1": 486.1, "r_x2": 414.7, "r_y2": 483.4, "r_x3": 412.8, "r_y3": 483.4, "coord_origin": "TOPLEFT" }, "text": "1", "orig": "1", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 149, "label": "text", "bbox": { "l": 200.6, "t": 488.3, "r": 207.1, "b": 491.0, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 159, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 200.6, "r_y0": 491.0, "r_x1": 207.1, "r_y1": 491.0, "r_x2": 207.1, "r_y2": 488.3, "r_x3": 200.6, "r_y3": 488.3, "coord_origin": "TOPLEFT" }, "text": "320", "orig": "320", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 150, "label": "text", "bbox": { "l": 367.6, "t": 488.3, "r": 369.8, "b": 491.0, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 160, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 367.6, "r_y0": 491.0, "r_x1": 369.8, "r_y1": 491.0, "r_x2": 369.8, "r_y2": 488.3, "r_x3": 367.6, "r_y3": 488.3, "coord_origin": "TOPLEFT" }, "text": "1", "orig": "1", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 151, "label": "text", "bbox": { "l": 382.7, "t": 488.3, "r": 384.8, "b": 491.0, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 161, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 382.7, "r_y0": 491.0, "r_x1": 384.8, "r_y1": 491.0, "r_x2": 384.8, "r_y2": 488.3, "r_x3": 382.7, "r_y3": 488.3, "coord_origin": "TOPLEFT" }, "text": "4", "orig": "4", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 152, "label": "text", "bbox": { "l": 397.7, "t": 488.3, "r": 402.1, "b": 491.0, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 162, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 397.7, "r_y0": 491.0, "r_x1": 402.1, "r_y1": 491.0, "r_x2": 402.1, "r_y2": 488.3, "r_x3": 397.7, "r_y3": 488.3, "coord_origin": "TOPLEFT" }, "text": "20", "orig": "20", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 153, "label": "text", "bbox": { "l": 200.6, "t": 493.2, "r": 208.5, "b": 495.9, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 163, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 200.6, "r_y0": 495.9, "r_x1": 208.5, "r_y1": 495.9, "r_x2": 208.5, "r_y2": 493.2, "r_x3": 200.6, "r_y3": 493.2, "coord_origin": "TOPLEFT" }, "text": "2013", "orig": "2013", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 154, "label": "text", "bbox": { "l": 264.3, "t": 493.2, "r": 266.3, "b": 495.9, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 164, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 264.3, "r_y0": 495.9, "r_x1": 266.3, "r_y1": 495.9, "r_x2": 266.3, "r_y2": 493.2, "r_x3": 264.3, "r_y3": 493.2, "coord_origin": "TOPLEFT" }, "text": "3", "orig": "3", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] } ] }, "text": "", "annotations": [], "provenance": null, "predicted_class": null, "confidence": null }, { "label": "text", "id": 155, "page_no": 9, "cluster": { "id": 155, "label": "text", "bbox": { "l": 227.9, "t": 665.8, "r": 230.1, "b": 675.3, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 165, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 227.9, "r_y0": 675.3, "r_x1": 230.1, "r_y1": 675.3, "r_x2": 230.1, "r_y2": 665.8, "r_x3": 227.9, "r_y3": 665.8, "coord_origin": "TOPLEFT" }, "text": "\u03bc", "orig": "\u03bc", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, "text": "\u03bc" }, { "label": "text", "id": 156, "page_no": 9, "cluster": { "id": 156, "label": "text", "bbox": { "l": 300.6, "t": 683.6, "r": 302.7, "b": 693.4, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 166, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 300.6, "r_y0": 693.4, "r_x1": 302.7, "r_y1": 693.4, "r_x2": 302.7, "r_y2": 683.6, "r_x3": 300.6, "r_y3": 683.6, "coord_origin": "TOPLEFT" }, "text": "\u2265", "orig": "\u2265", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, "text": "\u2265" } ], "body": [ { "label": "caption", "id": 4, "page_no": 9, "cluster": { "id": 4, "label": "caption", "bbox": { "l": 134.8, "t": 115.8, "r": 480.6, "b": 145.9, "coord_origin": "TOPLEFT" }, "confidence": 0.95, "cells": [ { "index": 3, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 134.8, "r_y0": 123.8, "r_x1": 173.1, "r_y1": 123.8, "r_x2": 173.1, "r_y2": 115.8, "r_x3": 134.8, "r_y3": 115.8, "coord_origin": "TOPLEFT" }, "text": "Table 2.", "orig": "Table 2.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 4, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 181.3, "r_y0": 124.0, "r_x1": 480.6, "r_y1": 124.0, "r_x2": 480.6, "r_y2": 115.9, "r_x3": 181.3, "r_y3": 115.9, "coord_origin": "TOPLEFT" }, "text": "TSR and cell detection results compared between OTSL and HTML on", "orig": "TSR and cell detection results compared between OTSL and HTML on", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 5, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 134.8, "r_y0": 134.9, "r_x1": 480.6, "r_y1": 134.9, "r_x2": 480.6, "r_y2": 126.9, "r_x3": 134.8, "r_y3": 126.9, "coord_origin": "TOPLEFT" }, "text": "the PubTabNet [22], FinTabNet [21] and PubTables-1M [14] data sets using Table-", "orig": "the PubTabNet [22], FinTabNet [21] and PubTables-1M [14] data sets using Table-", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 6, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 134.8, "r_y0": 145.9, "r_x1": 306.0, "r_y1": 145.9, "r_x2": 306.0, "r_y2": 137.8, "r_x3": 134.8, "r_y3": 137.8, "coord_origin": "TOPLEFT" }, "text": "Former [9] (with enc=6, dec=6, heads=8).", "orig": "Former [9] (with enc=6, dec=6, heads=8).", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, "text": "Table 2. TSR and cell detection results compared between OTSL and HTML on the PubTabNet [22], FinTabNet [21] and PubTables-1M [14] data sets using TableFormer [9] (with enc=6, dec=6, heads=8)." }, { "label": "table", "id": 0, "page_no": 9, "cluster": { "id": 0, "label": "table", "bbox": { "l": 143.6, "t": 156.3, "r": 470.8, "b": 263.3, "coord_origin": "TOPLEFT" }, "confidence": 0.99, "cells": [ { "index": 7, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 160.8, "r_y0": 174.6, "r_x1": 195.0, "r_y1": 174.6, "r_x2": 195.0, "r_y2": 166.6, "r_x3": 160.8, "r_y3": 166.6, "coord_origin": "TOPLEFT" }, "text": "Data set", "orig": "Data set", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 8, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 215.5, "r_y0": 174.6, "r_x1": 254.0, "r_y1": 174.6, "r_x2": 254.0, "r_y2": 166.5, "r_x3": 215.5, "r_y3": 166.5, "coord_origin": "TOPLEFT" }, "text": "Language", "orig": "Language", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 9, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 300.4, "r_y0": 169.1, "r_x1": 324.0, "r_y1": 169.1, "r_x2": 324.0, "r_y2": 161.1, "r_x3": 300.4, "r_y3": 161.1, "coord_origin": "TOPLEFT" }, "text": "TEDs", "orig": "TEDs", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 10, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 370.3, "r_y0": 174.6, "r_x1": 414.7, "r_y1": 174.6, "r_x2": 414.7, "r_y2": 166.6, "r_x3": 370.3, "r_y3": 166.6, "coord_origin": "TOPLEFT" }, "text": "mAP(0.75)", "orig": "mAP(0.75)", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 11, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 426.7, "r_y0": 169.1, "r_x1": 463.1, "r_y1": 169.1, "r_x2": 463.1, "r_y2": 161.1, "r_x3": 426.7, "r_y3": 161.1, "coord_origin": "TOPLEFT" }, "text": "Inference", "orig": "Inference", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 12, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 423.1, "r_y0": 180.1, "r_x1": 466.7, "r_y1": 180.1, "r_x2": 466.7, "r_y2": 172.0, "r_x3": 423.1, "r_y3": 172.0, "coord_origin": "TOPLEFT" }, "text": "time (secs)", "orig": "time (secs)", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 13, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 262.4, "r_y0": 182.1, "r_x1": 288.1, "r_y1": 182.1, "r_x2": 288.1, "r_y2": 174.0, "r_x3": 262.4, "r_y3": 174.0, "coord_origin": "TOPLEFT" }, "text": "simple", "orig": "simple", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 14, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 296.4, "r_y0": 182.1, "r_x1": 329.4, "r_y1": 182.1, "r_x2": 329.4, "r_y2": 174.0, "r_x3": 296.4, "r_y3": 174.0, "coord_origin": "TOPLEFT" }, "text": "complex", "orig": "complex", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 15, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 345.0, "r_y0": 182.1, "r_x1": 354.8, "r_y1": 182.1, "r_x2": 354.8, "r_y2": 174.0, "r_x3": 345.0, "r_y3": 174.0, "coord_origin": "TOPLEFT" }, "text": "all", "orig": "all", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 16, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 154.5, "r_y0": 200.9, "r_x1": 201.2, "r_y1": 200.9, "r_x2": 201.2, "r_y2": 192.9, "r_x3": 154.5, "r_y3": 192.9, "coord_origin": "TOPLEFT" }, "text": "PubTabNet", "orig": "PubTabNet", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 17, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 222.4, "r_y0": 195.5, "r_x1": 247.1, "r_y1": 195.5, "r_x2": 247.1, "r_y2": 187.4, "r_x3": 222.4, "r_y3": 187.4, "coord_origin": "TOPLEFT" }, "text": "OTSL", "orig": "OTSL", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 18, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 264.7, "r_y0": 195.5, "r_x1": 285.7, "r_y1": 195.5, "r_x2": 285.7, "r_y2": 187.4, "r_x3": 264.7, "r_y3": 187.4, "coord_origin": "TOPLEFT" }, "text": "0.965", "orig": "0.965", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 19, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 302.4, "r_y0": 195.5, "r_x1": 323.4, "r_y1": 195.5, "r_x2": 323.4, "r_y2": 187.4, "r_x3": 302.4, "r_y3": 187.4, "coord_origin": "TOPLEFT" }, "text": "0.934", "orig": "0.934", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 20, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 339.4, "r_y0": 195.5, "r_x1": 360.4, "r_y1": 195.5, "r_x2": 360.4, "r_y2": 187.4, "r_x3": 339.4, "r_y3": 187.4, "coord_origin": "TOPLEFT" }, "text": "0.955", "orig": "0.955", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 21, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 383.1, "r_y0": 195.2, "r_x1": 402.0, "r_y1": 195.2, "r_x2": 402.0, "r_y2": 187.3, "r_x3": 383.1, "r_y3": 187.3, "coord_origin": "TOPLEFT" }, "text": "0.88", "orig": "0.88", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 22, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 435.5, "r_y0": 195.2, "r_x1": 454.4, "r_y1": 195.2, "r_x2": 454.4, "r_y2": 187.3, "r_x3": 435.5, "r_y3": 187.3, "coord_origin": "TOPLEFT" }, "text": "2.73", "orig": "2.73", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 23, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 220.9, "r_y0": 208.4, "r_x1": 248.7, "r_y1": 208.4, "r_x2": 248.7, "r_y2": 200.3, "r_x3": 220.9, "r_y3": 200.3, "coord_origin": "TOPLEFT" }, "text": "HTML", "orig": "HTML", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 24, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 264.7, "r_y0": 208.4, "r_x1": 285.7, "r_y1": 208.4, "r_x2": 285.7, "r_y2": 200.3, "r_x3": 264.7, "r_y3": 200.3, "coord_origin": "TOPLEFT" }, "text": "0.969", "orig": "0.969", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 25, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 302.4, "r_y0": 208.4, "r_x1": 323.4, "r_y1": 208.4, "r_x2": 323.4, "r_y2": 200.3, "r_x3": 302.4, "r_y3": 200.3, "coord_origin": "TOPLEFT" }, "text": "0.927", "orig": "0.927", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 26, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 339.4, "r_y0": 208.4, "r_x1": 360.4, "r_y1": 208.4, "r_x2": 360.4, "r_y2": 200.3, "r_x3": 339.4, "r_y3": 200.3, "coord_origin": "TOPLEFT" }, "text": "0.955", "orig": "0.955", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 27, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 382.1, "r_y0": 208.4, "r_x1": 403.0, "r_y1": 208.4, "r_x2": 403.0, "r_y2": 200.3, "r_x3": 382.1, "r_y3": 200.3, "coord_origin": "TOPLEFT" }, "text": "0.857", "orig": "0.857", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 28, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 436.7, "r_y0": 208.4, "r_x1": 453.1, "r_y1": 208.4, "r_x2": 453.1, "r_y2": 200.3, "r_x3": 436.7, "r_y3": 200.3, "coord_origin": "TOPLEFT" }, "text": "5.39", "orig": "5.39", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 29, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 155.9, "r_y0": 227.2, "r_x1": 199.8, "r_y1": 227.2, "r_x2": 199.8, "r_y2": 219.2, "r_x3": 155.9, "r_y3": 219.2, "coord_origin": "TOPLEFT" }, "text": "FinTabNet", "orig": "FinTabNet", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 30, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 222.4, "r_y0": 221.8, "r_x1": 247.1, "r_y1": 221.8, "r_x2": 247.1, "r_y2": 213.7, "r_x3": 222.4, "r_y3": 213.7, "coord_origin": "TOPLEFT" }, "text": "OTSL", "orig": "OTSL", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 31, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 264.7, "r_y0": 221.8, "r_x1": 285.7, "r_y1": 221.8, "r_x2": 285.7, "r_y2": 213.7, "r_x3": 264.7, "r_y3": 213.7, "coord_origin": "TOPLEFT" }, "text": "0.955", "orig": "0.955", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 32, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 302.4, "r_y0": 221.8, "r_x1": 323.4, "r_y1": 221.8, "r_x2": 323.4, "r_y2": 213.7, "r_x3": 302.4, "r_y3": 213.7, "coord_origin": "TOPLEFT" }, "text": "0.961", "orig": "0.961", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 33, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 337.8, "r_y0": 221.5, "r_x1": 362.0, "r_y1": 221.5, "r_x2": 362.0, "r_y2": 213.6, "r_x3": 337.8, "r_y3": 213.6, "coord_origin": "TOPLEFT" }, "text": "0.959", "orig": "0.959", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 34, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 380.5, "r_y0": 221.5, "r_x1": 404.6, "r_y1": 221.5, "r_x2": 404.6, "r_y2": 213.6, "r_x3": 380.5, "r_y3": 213.6, "coord_origin": "TOPLEFT" }, "text": "0.862", "orig": "0.862", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 35, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 435.5, "r_y0": 221.5, "r_x1": 454.4, "r_y1": 221.5, "r_x2": 454.4, "r_y2": 213.6, "r_x3": 435.5, "r_y3": 213.6, "coord_origin": "TOPLEFT" }, "text": "1.85", "orig": "1.85", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 36, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 220.9, "r_y0": 234.7, "r_x1": 248.7, "r_y1": 234.7, "r_x2": 248.7, "r_y2": 226.6, "r_x3": 220.9, "r_y3": 226.6, "coord_origin": "TOPLEFT" }, "text": "HTML", "orig": "HTML", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 37, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 264.7, "r_y0": 234.7, "r_x1": 285.7, "r_y1": 234.7, "r_x2": 285.7, "r_y2": 226.6, "r_x3": 264.7, "r_y3": 226.6, "coord_origin": "TOPLEFT" }, "text": "0.917", "orig": "0.917", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 38, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 302.4, "r_y0": 234.7, "r_x1": 323.4, "r_y1": 234.7, "r_x2": 323.4, "r_y2": 226.6, "r_x3": 302.4, "r_y3": 226.6, "coord_origin": "TOPLEFT" }, "text": "0.922", "orig": "0.922", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 39, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 341.7, "r_y0": 234.7, "r_x1": 358.1, "r_y1": 234.7, "r_x2": 358.1, "r_y2": 226.6, "r_x3": 341.7, "r_y3": 226.6, "coord_origin": "TOPLEFT" }, "text": "0.92", "orig": "0.92", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 40, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 382.1, "r_y0": 234.7, "r_x1": 403.0, "r_y1": 234.7, "r_x2": 403.0, "r_y2": 226.6, "r_x3": 382.1, "r_y3": 226.6, "coord_origin": "TOPLEFT" }, "text": "0.722", "orig": "0.722", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 41, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 436.7, "r_y0": 234.7, "r_x1": 453.1, "r_y1": 234.7, "r_x2": 453.1, "r_y2": 226.6, "r_x3": 436.7, "r_y3": 226.6, "coord_origin": "TOPLEFT" }, "text": "3.26", "orig": "3.26", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 42, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 148.6, "r_y0": 253.5, "r_x1": 207.2, "r_y1": 253.5, "r_x2": 207.2, "r_y2": 245.5, "r_x3": 148.6, "r_y3": 245.5, "coord_origin": "TOPLEFT" }, "text": "PubTables-1M", "orig": "PubTables-1M", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 43, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 222.4, "r_y0": 248.1, "r_x1": 247.1, "r_y1": 248.1, "r_x2": 247.1, "r_y2": 240.0, "r_x3": 222.4, "r_y3": 240.0, "coord_origin": "TOPLEFT" }, "text": "OTSL", "orig": "OTSL", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 44, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 264.7, "r_y0": 248.1, "r_x1": 285.7, "r_y1": 248.1, "r_x2": 285.7, "r_y2": 240.0, "r_x3": 264.7, "r_y3": 240.0, "coord_origin": "TOPLEFT" }, "text": "0.987", "orig": "0.987", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 45, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 302.4, "r_y0": 248.1, "r_x1": 323.4, "r_y1": 248.1, "r_x2": 323.4, "r_y2": 240.0, "r_x3": 302.4, "r_y3": 240.0, "coord_origin": "TOPLEFT" }, "text": "0.964", "orig": "0.964", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 46, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 337.8, "r_y0": 247.8, "r_x1": 362.0, "r_y1": 247.8, "r_x2": 362.0, "r_y2": 239.9, "r_x3": 337.8, "r_y3": 239.9, "coord_origin": "TOPLEFT" }, "text": "0.977", "orig": "0.977", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 47, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 380.5, "r_y0": 247.8, "r_x1": 404.6, "r_y1": 247.8, "r_x2": 404.6, "r_y2": 239.9, "r_x3": 380.5, "r_y3": 239.9, "coord_origin": "TOPLEFT" }, "text": "0.896", "orig": "0.896", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 48, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 435.5, "r_y0": 247.8, "r_x1": 454.4, "r_y1": 247.8, "r_x2": 454.4, "r_y2": 239.9, "r_x3": 435.5, "r_y3": 239.9, "coord_origin": "TOPLEFT" }, "text": "1.79", "orig": "1.79", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 49, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 220.9, "r_y0": 261.0, "r_x1": 248.7, "r_y1": 261.0, "r_x2": 248.7, "r_y2": 252.9, "r_x3": 220.9, "r_y3": 252.9, "coord_origin": "TOPLEFT" }, "text": "HTML", "orig": "HTML", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 50, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 264.7, "r_y0": 261.0, "r_x1": 285.7, "r_y1": 261.0, "r_x2": 285.7, "r_y2": 252.9, "r_x3": 264.7, "r_y3": 252.9, "coord_origin": "TOPLEFT" }, "text": "0.983", "orig": "0.983", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 51, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 302.4, "r_y0": 261.0, "r_x1": 323.4, "r_y1": 261.0, "r_x2": 323.4, "r_y2": 252.9, "r_x3": 302.4, "r_y3": 252.9, "coord_origin": "TOPLEFT" }, "text": "0.944", "orig": "0.944", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 52, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 339.4, "r_y0": 261.0, "r_x1": 360.4, "r_y1": 261.0, "r_x2": 360.4, "r_y2": 252.9, "r_x3": 339.4, "r_y3": 252.9, "coord_origin": "TOPLEFT" }, "text": "0.966", "orig": "0.966", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 53, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 382.1, "r_y0": 261.0, "r_x1": 403.0, "r_y1": 261.0, "r_x2": 403.0, "r_y2": 252.9, "r_x3": 382.1, "r_y3": 252.9, "coord_origin": "TOPLEFT" }, "text": "0.889", "orig": "0.889", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 54, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 436.7, "r_y0": 261.0, "r_x1": 453.1, "r_y1": 261.0, "r_x2": 453.1, "r_y2": 252.9, "r_x3": 436.7, "r_y3": 252.9, "coord_origin": "TOPLEFT" }, "text": "3.26", "orig": "3.26", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [ { "id": 10, "label": "text", "bbox": { "l": 160.8, "t": 166.6, "r": 195.0, "b": 174.6, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 7, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 160.8, "r_y0": 174.6, "r_x1": 195.0, "r_y1": 174.6, "r_x2": 195.0, "r_y2": 166.6, "r_x3": 160.8, "r_y3": 166.6, "coord_origin": "TOPLEFT" }, "text": "Data set", "orig": "Data set", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 11, "label": "text", "bbox": { "l": 215.5, "t": 166.5, "r": 254.0, "b": 174.6, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 8, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 215.5, "r_y0": 174.6, "r_x1": 254.0, "r_y1": 174.6, "r_x2": 254.0, "r_y2": 166.5, "r_x3": 215.5, "r_y3": 166.5, "coord_origin": "TOPLEFT" }, "text": "Language", "orig": "Language", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 12, "label": "text", "bbox": { "l": 300.4, "t": 161.1, "r": 324.0, "b": 169.1, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 9, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 300.4, "r_y0": 169.1, "r_x1": 324.0, "r_y1": 169.1, "r_x2": 324.0, "r_y2": 161.1, "r_x3": 300.4, "r_y3": 161.1, "coord_origin": "TOPLEFT" }, "text": "TEDs", "orig": "TEDs", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 13, "label": "text", "bbox": { "l": 370.3, "t": 166.6, "r": 414.7, "b": 174.6, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 10, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 370.3, "r_y0": 174.6, "r_x1": 414.7, "r_y1": 174.6, "r_x2": 414.7, "r_y2": 166.6, "r_x3": 370.3, "r_y3": 166.6, "coord_origin": "TOPLEFT" }, "text": "mAP(0.75)", "orig": "mAP(0.75)", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 14, "label": "text", "bbox": { "l": 426.7, "t": 161.1, "r": 463.1, "b": 169.1, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 11, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 426.7, "r_y0": 169.1, "r_x1": 463.1, "r_y1": 169.1, "r_x2": 463.1, "r_y2": 161.1, "r_x3": 426.7, "r_y3": 161.1, "coord_origin": "TOPLEFT" }, "text": "Inference", "orig": "Inference", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 15, "label": "text", "bbox": { "l": 423.1, "t": 172.0, "r": 466.7, "b": 180.1, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 12, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 423.1, "r_y0": 180.1, "r_x1": 466.7, "r_y1": 180.1, "r_x2": 466.7, "r_y2": 172.0, "r_x3": 423.1, "r_y3": 172.0, "coord_origin": "TOPLEFT" }, "text": "time (secs)", "orig": "time (secs)", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 16, "label": "text", "bbox": { "l": 262.4, "t": 174.0, "r": 288.1, "b": 182.1, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 13, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 262.4, "r_y0": 182.1, "r_x1": 288.1, "r_y1": 182.1, "r_x2": 288.1, "r_y2": 174.0, "r_x3": 262.4, "r_y3": 174.0, "coord_origin": "TOPLEFT" }, "text": "simple", "orig": "simple", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 17, "label": "text", "bbox": { "l": 296.4, "t": 174.0, "r": 329.4, "b": 182.1, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 14, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 296.4, "r_y0": 182.1, "r_x1": 329.4, "r_y1": 182.1, "r_x2": 329.4, "r_y2": 174.0, "r_x3": 296.4, "r_y3": 174.0, "coord_origin": "TOPLEFT" }, "text": "complex", "orig": "complex", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 18, "label": "text", "bbox": { "l": 345.0, "t": 174.0, "r": 354.8, "b": 182.1, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 15, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 345.0, "r_y0": 182.1, "r_x1": 354.8, "r_y1": 182.1, "r_x2": 354.8, "r_y2": 174.0, "r_x3": 345.0, "r_y3": 174.0, "coord_origin": "TOPLEFT" }, "text": "all", "orig": "all", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 19, "label": "text", "bbox": { "l": 154.5, "t": 192.9, "r": 201.2, "b": 200.9, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 16, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 154.5, "r_y0": 200.9, "r_x1": 201.2, "r_y1": 200.9, "r_x2": 201.2, "r_y2": 192.9, "r_x3": 154.5, "r_y3": 192.9, "coord_origin": "TOPLEFT" }, "text": "PubTabNet", "orig": "PubTabNet", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 20, "label": "text", "bbox": { "l": 222.4, "t": 187.4, "r": 247.1, "b": 195.5, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 17, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 222.4, "r_y0": 195.5, "r_x1": 247.1, "r_y1": 195.5, "r_x2": 247.1, "r_y2": 187.4, "r_x3": 222.4, "r_y3": 187.4, "coord_origin": "TOPLEFT" }, "text": "OTSL", "orig": "OTSL", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 21, "label": "text", "bbox": { "l": 264.7, "t": 187.4, "r": 285.7, "b": 195.5, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 18, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 264.7, "r_y0": 195.5, "r_x1": 285.7, "r_y1": 195.5, "r_x2": 285.7, "r_y2": 187.4, "r_x3": 264.7, "r_y3": 187.4, "coord_origin": "TOPLEFT" }, "text": "0.965", "orig": "0.965", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 22, "label": "text", "bbox": { "l": 302.4, "t": 187.4, "r": 323.4, "b": 195.5, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 19, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 302.4, "r_y0": 195.5, "r_x1": 323.4, "r_y1": 195.5, "r_x2": 323.4, "r_y2": 187.4, "r_x3": 302.4, "r_y3": 187.4, "coord_origin": "TOPLEFT" }, "text": "0.934", "orig": "0.934", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 23, "label": "text", "bbox": { "l": 339.4, "t": 187.4, "r": 360.4, "b": 195.5, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 20, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 339.4, "r_y0": 195.5, "r_x1": 360.4, "r_y1": 195.5, "r_x2": 360.4, "r_y2": 187.4, "r_x3": 339.4, "r_y3": 187.4, "coord_origin": "TOPLEFT" }, "text": "0.955", "orig": "0.955", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 24, "label": "text", "bbox": { "l": 383.1, "t": 187.3, "r": 402.0, "b": 195.2, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 21, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 383.1, "r_y0": 195.2, "r_x1": 402.0, "r_y1": 195.2, "r_x2": 402.0, "r_y2": 187.3, "r_x3": 383.1, "r_y3": 187.3, "coord_origin": "TOPLEFT" }, "text": "0.88", "orig": "0.88", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 25, "label": "text", "bbox": { "l": 435.5, "t": 187.3, "r": 454.4, "b": 195.2, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 22, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 435.5, "r_y0": 195.2, "r_x1": 454.4, "r_y1": 195.2, "r_x2": 454.4, "r_y2": 187.3, "r_x3": 435.5, "r_y3": 187.3, "coord_origin": "TOPLEFT" }, "text": "2.73", "orig": "2.73", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 26, "label": "text", "bbox": { "l": 220.9, "t": 200.3, "r": 248.7, "b": 208.4, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 23, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 220.9, "r_y0": 208.4, "r_x1": 248.7, "r_y1": 208.4, "r_x2": 248.7, "r_y2": 200.3, "r_x3": 220.9, "r_y3": 200.3, "coord_origin": "TOPLEFT" }, "text": "HTML", "orig": "HTML", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 27, "label": "text", "bbox": { "l": 264.7, "t": 200.3, "r": 285.7, "b": 208.4, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 24, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 264.7, "r_y0": 208.4, "r_x1": 285.7, "r_y1": 208.4, "r_x2": 285.7, "r_y2": 200.3, "r_x3": 264.7, "r_y3": 200.3, "coord_origin": "TOPLEFT" }, "text": "0.969", "orig": "0.969", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 28, "label": "text", "bbox": { "l": 302.4, "t": 200.3, "r": 323.4, "b": 208.4, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 25, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 302.4, "r_y0": 208.4, "r_x1": 323.4, "r_y1": 208.4, "r_x2": 323.4, "r_y2": 200.3, "r_x3": 302.4, "r_y3": 200.3, "coord_origin": "TOPLEFT" }, "text": "0.927", "orig": "0.927", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 29, "label": "text", "bbox": { "l": 339.4, "t": 200.3, "r": 360.4, "b": 208.4, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 26, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 339.4, "r_y0": 208.4, "r_x1": 360.4, "r_y1": 208.4, "r_x2": 360.4, "r_y2": 200.3, "r_x3": 339.4, "r_y3": 200.3, "coord_origin": "TOPLEFT" }, "text": "0.955", "orig": "0.955", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 30, "label": "text", "bbox": { "l": 382.1, "t": 200.3, "r": 403.0, "b": 208.4, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 27, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 382.1, "r_y0": 208.4, "r_x1": 403.0, "r_y1": 208.4, "r_x2": 403.0, "r_y2": 200.3, "r_x3": 382.1, "r_y3": 200.3, "coord_origin": "TOPLEFT" }, "text": "0.857", "orig": "0.857", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 31, "label": "text", "bbox": { "l": 436.7, "t": 200.3, "r": 453.1, "b": 208.4, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 28, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 436.7, "r_y0": 208.4, "r_x1": 453.1, "r_y1": 208.4, "r_x2": 453.1, "r_y2": 200.3, "r_x3": 436.7, "r_y3": 200.3, "coord_origin": "TOPLEFT" }, "text": "5.39", "orig": "5.39", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 32, "label": "text", "bbox": { "l": 155.9, "t": 219.2, "r": 199.8, "b": 227.2, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 29, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 155.9, "r_y0": 227.2, "r_x1": 199.8, "r_y1": 227.2, "r_x2": 199.8, "r_y2": 219.2, "r_x3": 155.9, "r_y3": 219.2, "coord_origin": "TOPLEFT" }, "text": "FinTabNet", "orig": "FinTabNet", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 33, "label": "text", "bbox": { "l": 222.4, "t": 213.7, "r": 247.1, "b": 221.8, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 30, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 222.4, "r_y0": 221.8, "r_x1": 247.1, "r_y1": 221.8, "r_x2": 247.1, "r_y2": 213.7, "r_x3": 222.4, "r_y3": 213.7, "coord_origin": "TOPLEFT" }, "text": "OTSL", "orig": "OTSL", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 34, "label": "text", "bbox": { "l": 264.7, "t": 213.7, "r": 285.7, "b": 221.8, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 31, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 264.7, "r_y0": 221.8, "r_x1": 285.7, "r_y1": 221.8, "r_x2": 285.7, "r_y2": 213.7, "r_x3": 264.7, "r_y3": 213.7, "coord_origin": "TOPLEFT" }, "text": "0.955", "orig": "0.955", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 35, "label": "text", "bbox": { "l": 302.4, "t": 213.7, "r": 323.4, "b": 221.8, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 32, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 302.4, "r_y0": 221.8, "r_x1": 323.4, "r_y1": 221.8, "r_x2": 323.4, "r_y2": 213.7, "r_x3": 302.4, "r_y3": 213.7, "coord_origin": "TOPLEFT" }, "text": "0.961", "orig": "0.961", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 36, "label": "text", "bbox": { "l": 337.8, "t": 213.6, "r": 362.0, "b": 221.5, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 33, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 337.8, "r_y0": 221.5, "r_x1": 362.0, "r_y1": 221.5, "r_x2": 362.0, "r_y2": 213.6, "r_x3": 337.8, "r_y3": 213.6, "coord_origin": "TOPLEFT" }, "text": "0.959", "orig": "0.959", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 37, "label": "text", "bbox": { "l": 380.5, "t": 213.6, "r": 404.6, "b": 221.5, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 34, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 380.5, "r_y0": 221.5, "r_x1": 404.6, "r_y1": 221.5, "r_x2": 404.6, "r_y2": 213.6, "r_x3": 380.5, "r_y3": 213.6, "coord_origin": "TOPLEFT" }, "text": "0.862", "orig": "0.862", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 38, "label": "text", "bbox": { "l": 435.5, "t": 213.6, "r": 454.4, "b": 221.5, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 35, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 435.5, "r_y0": 221.5, "r_x1": 454.4, "r_y1": 221.5, "r_x2": 454.4, "r_y2": 213.6, "r_x3": 435.5, "r_y3": 213.6, "coord_origin": "TOPLEFT" }, "text": "1.85", "orig": "1.85", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 39, "label": "text", "bbox": { "l": 220.9, "t": 226.6, "r": 248.7, "b": 234.7, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 36, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 220.9, "r_y0": 234.7, "r_x1": 248.7, "r_y1": 234.7, "r_x2": 248.7, "r_y2": 226.6, "r_x3": 220.9, "r_y3": 226.6, "coord_origin": "TOPLEFT" }, "text": "HTML", "orig": "HTML", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 40, "label": "text", "bbox": { "l": 264.7, "t": 226.6, "r": 285.7, "b": 234.7, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 37, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 264.7, "r_y0": 234.7, "r_x1": 285.7, "r_y1": 234.7, "r_x2": 285.7, "r_y2": 226.6, "r_x3": 264.7, "r_y3": 226.6, "coord_origin": "TOPLEFT" }, "text": "0.917", "orig": "0.917", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 41, "label": "text", "bbox": { "l": 302.4, "t": 226.6, "r": 323.4, "b": 234.7, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 38, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 302.4, "r_y0": 234.7, "r_x1": 323.4, "r_y1": 234.7, "r_x2": 323.4, "r_y2": 226.6, "r_x3": 302.4, "r_y3": 226.6, "coord_origin": "TOPLEFT" }, "text": "0.922", "orig": "0.922", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 42, "label": "text", "bbox": { "l": 341.7, "t": 226.6, "r": 358.1, "b": 234.7, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 39, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 341.7, "r_y0": 234.7, "r_x1": 358.1, "r_y1": 234.7, "r_x2": 358.1, "r_y2": 226.6, "r_x3": 341.7, "r_y3": 226.6, "coord_origin": "TOPLEFT" }, "text": "0.92", "orig": "0.92", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 43, "label": "text", "bbox": { "l": 382.1, "t": 226.6, "r": 403.0, "b": 234.7, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 40, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 382.1, "r_y0": 234.7, "r_x1": 403.0, "r_y1": 234.7, "r_x2": 403.0, "r_y2": 226.6, "r_x3": 382.1, "r_y3": 226.6, "coord_origin": "TOPLEFT" }, "text": "0.722", "orig": "0.722", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 44, "label": "text", "bbox": { "l": 436.7, "t": 226.6, "r": 453.1, "b": 234.7, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 41, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 436.7, "r_y0": 234.7, "r_x1": 453.1, "r_y1": 234.7, "r_x2": 453.1, "r_y2": 226.6, "r_x3": 436.7, "r_y3": 226.6, "coord_origin": "TOPLEFT" }, "text": "3.26", "orig": "3.26", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 45, "label": "text", "bbox": { "l": 148.6, "t": 245.5, "r": 207.2, "b": 253.5, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 42, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 148.6, "r_y0": 253.5, "r_x1": 207.2, "r_y1": 253.5, "r_x2": 207.2, "r_y2": 245.5, "r_x3": 148.6, "r_y3": 245.5, "coord_origin": "TOPLEFT" }, "text": "PubTables-1M", "orig": "PubTables-1M", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 46, "label": "text", "bbox": { "l": 222.4, "t": 240.0, "r": 247.1, "b": 248.1, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 43, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 222.4, "r_y0": 248.1, "r_x1": 247.1, "r_y1": 248.1, "r_x2": 247.1, "r_y2": 240.0, "r_x3": 222.4, "r_y3": 240.0, "coord_origin": "TOPLEFT" }, "text": "OTSL", "orig": "OTSL", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 47, "label": "text", "bbox": { "l": 264.7, "t": 240.0, "r": 285.7, "b": 248.1, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 44, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 264.7, "r_y0": 248.1, "r_x1": 285.7, "r_y1": 248.1, "r_x2": 285.7, "r_y2": 240.0, "r_x3": 264.7, "r_y3": 240.0, "coord_origin": "TOPLEFT" }, "text": "0.987", "orig": "0.987", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 48, "label": "text", "bbox": { "l": 302.4, "t": 240.0, "r": 323.4, "b": 248.1, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 45, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 302.4, "r_y0": 248.1, "r_x1": 323.4, "r_y1": 248.1, "r_x2": 323.4, "r_y2": 240.0, "r_x3": 302.4, "r_y3": 240.0, "coord_origin": "TOPLEFT" }, "text": "0.964", "orig": "0.964", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 49, "label": "text", "bbox": { "l": 337.8, "t": 239.9, "r": 362.0, "b": 247.8, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 46, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 337.8, "r_y0": 247.8, "r_x1": 362.0, "r_y1": 247.8, "r_x2": 362.0, "r_y2": 239.9, "r_x3": 337.8, "r_y3": 239.9, "coord_origin": "TOPLEFT" }, "text": "0.977", "orig": "0.977", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 50, "label": "text", "bbox": { "l": 380.5, "t": 239.9, "r": 404.6, "b": 247.8, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 47, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 380.5, "r_y0": 247.8, "r_x1": 404.6, "r_y1": 247.8, "r_x2": 404.6, "r_y2": 239.9, "r_x3": 380.5, "r_y3": 239.9, "coord_origin": "TOPLEFT" }, "text": "0.896", "orig": "0.896", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 51, "label": "text", "bbox": { "l": 435.5, "t": 239.9, "r": 454.4, "b": 247.8, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 48, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 435.5, "r_y0": 247.8, "r_x1": 454.4, "r_y1": 247.8, "r_x2": 454.4, "r_y2": 239.9, "r_x3": 435.5, "r_y3": 239.9, "coord_origin": "TOPLEFT" }, "text": "1.79", "orig": "1.79", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 52, "label": "text", "bbox": { "l": 220.9, "t": 252.9, "r": 248.7, "b": 261.0, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 49, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 220.9, "r_y0": 261.0, "r_x1": 248.7, "r_y1": 261.0, "r_x2": 248.7, "r_y2": 252.9, "r_x3": 220.9, "r_y3": 252.9, "coord_origin": "TOPLEFT" }, "text": "HTML", "orig": "HTML", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 53, "label": "text", "bbox": { "l": 264.7, "t": 252.9, "r": 285.7, "b": 261.0, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 50, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 264.7, "r_y0": 261.0, "r_x1": 285.7, "r_y1": 261.0, "r_x2": 285.7, "r_y2": 252.9, "r_x3": 264.7, "r_y3": 252.9, "coord_origin": "TOPLEFT" }, "text": "0.983", "orig": "0.983", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 54, "label": "text", "bbox": { "l": 302.4, "t": 252.9, "r": 323.4, "b": 261.0, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 51, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 302.4, "r_y0": 261.0, "r_x1": 323.4, "r_y1": 261.0, "r_x2": 323.4, "r_y2": 252.9, "r_x3": 302.4, "r_y3": 252.9, "coord_origin": "TOPLEFT" }, "text": "0.944", "orig": "0.944", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 55, "label": "text", "bbox": { "l": 339.4, "t": 252.9, "r": 360.4, "b": 261.0, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 52, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 339.4, "r_y0": 261.0, "r_x1": 360.4, "r_y1": 261.0, "r_x2": 360.4, "r_y2": 252.9, "r_x3": 339.4, "r_y3": 252.9, "coord_origin": "TOPLEFT" }, "text": "0.966", "orig": "0.966", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 56, "label": "text", "bbox": { "l": 382.1, "t": 252.9, "r": 403.0, "b": 261.0, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 53, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 382.1, "r_y0": 261.0, "r_x1": 403.0, "r_y1": 261.0, "r_x2": 403.0, "r_y2": 252.9, "r_x3": 382.1, "r_y3": 252.9, "coord_origin": "TOPLEFT" }, "text": "0.889", "orig": "0.889", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 57, "label": "text", "bbox": { "l": 436.7, "t": 252.9, "r": 453.1, "b": 261.0, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 54, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 436.7, "r_y0": 261.0, "r_x1": 453.1, "r_y1": 261.0, "r_x2": 453.1, "r_y2": 252.9, "r_x3": 436.7, "r_y3": 252.9, "coord_origin": "TOPLEFT" }, "text": "3.26", "orig": "3.26", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] } ] }, "text": null, "otsl_seq": [ "ched", "ched", "ched", "lcel", "lcel", "ched", "ched", "nl", "ucel", "ucel", "ched", "ched", "ched", "ucel", "ucel", "nl", "fcel", "fcel", "fcel", "fcel", "fcel", "fcel", "fcel", "nl", "fcel", "fcel", "fcel", "fcel", "fcel", "fcel", "fcel", "nl", "fcel", "fcel", "fcel", "fcel", "fcel", "fcel", "fcel", "nl" ], "num_rows": 5, "num_cols": 7, "table_cells": [ { "bbox": { "l": 160.8, "t": 166.6, "r": 195.0, "b": 174.6, "coord_origin": "TOPLEFT" }, "row_span": 2, "col_span": 1, "start_row_offset_idx": 0, "end_row_offset_idx": 2, "start_col_offset_idx": 0, "end_col_offset_idx": 1, "text": "Data set", "column_header": true, "row_header": false, "row_section": false }, { "bbox": { "l": 215.5, "t": 166.5, "r": 254.0, "b": 174.6, "coord_origin": "TOPLEFT" }, "row_span": 2, "col_span": 1, "start_row_offset_idx": 0, "end_row_offset_idx": 2, "start_col_offset_idx": 1, "end_col_offset_idx": 2, "text": "Language", "column_header": true, "row_header": false, "row_section": false }, { "bbox": { "l": 300.4, "t": 161.1, "r": 324.0, "b": 169.1, "coord_origin": "TOPLEFT" }, "row_span": 1, "col_span": 3, "start_row_offset_idx": 0, "end_row_offset_idx": 1, "start_col_offset_idx": 2, "end_col_offset_idx": 5, "text": "TEDs", "column_header": true, "row_header": false, "row_section": false }, { "bbox": { "l": 370.3, "t": 166.6, "r": 414.7, "b": 174.6, "coord_origin": "TOPLEFT" }, "row_span": 2, "col_span": 1, "start_row_offset_idx": 0, "end_row_offset_idx": 2, "start_col_offset_idx": 5, "end_col_offset_idx": 6, "text": "mAP(0.75)", "column_header": true, "row_header": false, "row_section": false }, { "bbox": { "l": 426.7, "t": 161.1, "r": 463.1, "b": 169.1, "coord_origin": "TOPLEFT" }, "row_span": 2, "col_span": 1, "start_row_offset_idx": 0, "end_row_offset_idx": 2, "start_col_offset_idx": 6, "end_col_offset_idx": 7, "text": "Inference time (secs)", "column_header": true, "row_header": false, "row_section": false }, { "bbox": { "l": 262.4, "t": 174.0, "r": 288.1, "b": 182.1, "coord_origin": "TOPLEFT" }, "row_span": 1, "col_span": 1, "start_row_offset_idx": 1, "end_row_offset_idx": 2, "start_col_offset_idx": 2, "end_col_offset_idx": 3, "text": "simple", "column_header": true, "row_header": false, "row_section": false }, { "bbox": { "l": 296.4, "t": 174.0, "r": 329.4, "b": 182.1, "coord_origin": "TOPLEFT" }, "row_span": 1, "col_span": 1, "start_row_offset_idx": 1, "end_row_offset_idx": 2, "start_col_offset_idx": 3, "end_col_offset_idx": 4, "text": "complex", "column_header": true, "row_header": false, "row_section": false }, { "bbox": { "l": 345.0, "t": 174.0, "r": 354.8, "b": 182.1, "coord_origin": "TOPLEFT" }, "row_span": 1, "col_span": 1, "start_row_offset_idx": 1, "end_row_offset_idx": 2, "start_col_offset_idx": 4, "end_col_offset_idx": 5, "text": "all", "column_header": true, "row_header": false, "row_section": false }, { "bbox": { "l": 154.5, "t": 192.9, "r": 201.2, "b": 200.9, "coord_origin": "TOPLEFT" }, "row_span": 1, "col_span": 1, "start_row_offset_idx": 2, "end_row_offset_idx": 3, "start_col_offset_idx": 0, "end_col_offset_idx": 1, "text": "PubTabNet", "column_header": false, "row_header": false, "row_section": false }, { "bbox": { "l": 222.4, "t": 187.4, "r": 247.1, "b": 195.5, "coord_origin": "TOPLEFT" }, "row_span": 1, "col_span": 1, "start_row_offset_idx": 2, "end_row_offset_idx": 3, "start_col_offset_idx": 1, "end_col_offset_idx": 2, "text": "OTSL HTML", "column_header": false, "row_header": false, "row_section": false }, { "bbox": { "l": 264.7, "t": 187.4, "r": 285.7, "b": 195.5, "coord_origin": "TOPLEFT" }, "row_span": 1, "col_span": 1, "start_row_offset_idx": 2, "end_row_offset_idx": 3, "start_col_offset_idx": 2, "end_col_offset_idx": 3, "text": "0.965 0.969", "column_header": false, "row_header": false, "row_section": false }, { "bbox": { "l": 302.4, "t": 187.4, "r": 323.4, "b": 195.5, "coord_origin": "TOPLEFT" }, "row_span": 1, "col_span": 1, "start_row_offset_idx": 2, "end_row_offset_idx": 3, "start_col_offset_idx": 3, "end_col_offset_idx": 4, "text": "0.934 0.927", "column_header": false, "row_header": false, "row_section": false }, { "bbox": { "l": 339.4, "t": 187.4, "r": 360.4, "b": 195.5, "coord_origin": "TOPLEFT" }, "row_span": 1, "col_span": 1, "start_row_offset_idx": 2, "end_row_offset_idx": 3, "start_col_offset_idx": 4, "end_col_offset_idx": 5, "text": "0.955 0.955", "column_header": false, "row_header": false, "row_section": false }, { "bbox": { "l": 383.1, "t": 187.3, "r": 402.0, "b": 195.2, "coord_origin": "TOPLEFT" }, "row_span": 1, "col_span": 1, "start_row_offset_idx": 2, "end_row_offset_idx": 3, "start_col_offset_idx": 5, "end_col_offset_idx": 6, "text": "0.88 0.857", "column_header": false, "row_header": false, "row_section": false }, { "bbox": { "l": 435.5, "t": 187.3, "r": 454.4, "b": 195.2, "coord_origin": "TOPLEFT" }, "row_span": 1, "col_span": 1, "start_row_offset_idx": 2, "end_row_offset_idx": 3, "start_col_offset_idx": 6, "end_col_offset_idx": 7, "text": "2.73 5.39", "column_header": false, "row_header": false, "row_section": false }, { "bbox": { "l": 155.9, "t": 219.2, "r": 199.8, "b": 227.2, "coord_origin": "TOPLEFT" }, "row_span": 1, "col_span": 1, "start_row_offset_idx": 3, "end_row_offset_idx": 4, "start_col_offset_idx": 0, "end_col_offset_idx": 1, "text": "FinTabNet", "column_header": false, "row_header": false, "row_section": false }, { "bbox": { "l": 222.4, "t": 213.7, "r": 247.1, "b": 221.8, "coord_origin": "TOPLEFT" }, "row_span": 1, "col_span": 1, "start_row_offset_idx": 3, "end_row_offset_idx": 4, "start_col_offset_idx": 1, "end_col_offset_idx": 2, "text": "OTSL HTML", "column_header": false, "row_header": false, "row_section": false }, { "bbox": { "l": 264.7, "t": 213.7, "r": 285.7, "b": 221.8, "coord_origin": "TOPLEFT" }, "row_span": 1, "col_span": 1, "start_row_offset_idx": 3, "end_row_offset_idx": 4, "start_col_offset_idx": 2, "end_col_offset_idx": 3, "text": "0.955 0.917", "column_header": false, "row_header": false, "row_section": false }, { "bbox": { "l": 302.4, "t": 213.7, "r": 323.4, "b": 221.8, "coord_origin": "TOPLEFT" }, "row_span": 1, "col_span": 1, "start_row_offset_idx": 3, "end_row_offset_idx": 4, "start_col_offset_idx": 3, "end_col_offset_idx": 4, "text": "0.961 0.922", "column_header": false, "row_header": false, "row_section": false }, { "bbox": { "l": 337.8, "t": 213.6, "r": 362.0, "b": 221.5, "coord_origin": "TOPLEFT" }, "row_span": 1, "col_span": 1, "start_row_offset_idx": 3, "end_row_offset_idx": 4, "start_col_offset_idx": 4, "end_col_offset_idx": 5, "text": "0.959 0.92", "column_header": false, "row_header": false, "row_section": false }, { "bbox": { "l": 380.5, "t": 213.6, "r": 404.6, "b": 221.5, "coord_origin": "TOPLEFT" }, "row_span": 1, "col_span": 1, "start_row_offset_idx": 3, "end_row_offset_idx": 4, "start_col_offset_idx": 5, "end_col_offset_idx": 6, "text": "0.862 0.722", "column_header": false, "row_header": false, "row_section": false }, { "bbox": { "l": 435.5, "t": 213.6, "r": 454.4, "b": 221.5, "coord_origin": "TOPLEFT" }, "row_span": 1, "col_span": 1, "start_row_offset_idx": 3, "end_row_offset_idx": 4, "start_col_offset_idx": 6, "end_col_offset_idx": 7, "text": "1.85 3.26", "column_header": false, "row_header": false, "row_section": false }, { "bbox": { "l": 148.6, "t": 245.5, "r": 207.2, "b": 253.5, "coord_origin": "TOPLEFT" }, "row_span": 1, "col_span": 1, "start_row_offset_idx": 4, "end_row_offset_idx": 5, "start_col_offset_idx": 0, "end_col_offset_idx": 1, "text": "PubTables-1M", "column_header": false, "row_header": false, "row_section": false }, { "bbox": { "l": 222.4, "t": 240.0, "r": 247.1, "b": 248.1, "coord_origin": "TOPLEFT" }, "row_span": 1, "col_span": 1, "start_row_offset_idx": 4, "end_row_offset_idx": 5, "start_col_offset_idx": 1, "end_col_offset_idx": 2, "text": "OTSL HTML", "column_header": false, "row_header": false, "row_section": false }, { "bbox": { "l": 264.7, "t": 240.0, "r": 285.7, "b": 248.1, "coord_origin": "TOPLEFT" }, "row_span": 1, "col_span": 1, "start_row_offset_idx": 4, "end_row_offset_idx": 5, "start_col_offset_idx": 2, "end_col_offset_idx": 3, "text": "0.987 0.983", "column_header": false, "row_header": false, "row_section": false }, { "bbox": { "l": 302.4, "t": 240.0, "r": 323.4, "b": 248.1, "coord_origin": "TOPLEFT" }, "row_span": 1, "col_span": 1, "start_row_offset_idx": 4, "end_row_offset_idx": 5, "start_col_offset_idx": 3, "end_col_offset_idx": 4, "text": "0.964 0.944", "column_header": false, "row_header": false, "row_section": false }, { "bbox": { "l": 337.8, "t": 239.9, "r": 362.0, "b": 247.8, "coord_origin": "TOPLEFT" }, "row_span": 1, "col_span": 1, "start_row_offset_idx": 4, "end_row_offset_idx": 5, "start_col_offset_idx": 4, "end_col_offset_idx": 5, "text": "0.977 0.966", "column_header": false, "row_header": false, "row_section": false }, { "bbox": { "l": 380.5, "t": 239.9, "r": 404.6, "b": 247.8, "coord_origin": "TOPLEFT" }, "row_span": 1, "col_span": 1, "start_row_offset_idx": 4, "end_row_offset_idx": 5, "start_col_offset_idx": 5, "end_col_offset_idx": 6, "text": "0.896 0.889", "column_header": false, "row_header": false, "row_section": false }, { "bbox": { "l": 435.5, "t": 239.9, "r": 454.4, "b": 247.8, "coord_origin": "TOPLEFT" }, "row_span": 1, "col_span": 1, "start_row_offset_idx": 4, "end_row_offset_idx": 5, "start_col_offset_idx": 6, "end_col_offset_idx": 7, "text": "1.79 3.26", "column_header": false, "row_header": false, "row_section": false } ] }, { "label": "section_header", "id": 3, "page_no": 9, "cluster": { "id": 3, "label": "section_header", "bbox": { "l": 134.8, "t": 288.9, "r": 257.1, "b": 297.7, "coord_origin": "TOPLEFT" }, "confidence": 0.95, "cells": [ { "index": 55, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 134.8, "r_y0": 297.7, "r_x1": 149.4, "r_y1": 297.7, "r_x2": 149.4, "r_y2": 288.9, "r_x3": 134.8, "r_y3": 288.9, "coord_origin": "TOPLEFT" }, "text": "5.3", "orig": "5.3", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 56, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 160.9, "r_y0": 297.7, "r_x1": 257.1, "r_y1": 297.7, "r_x2": 257.1, "r_y2": 288.9, "r_x3": 160.9, "r_y3": 288.9, "coord_origin": "TOPLEFT" }, "text": "Qualitative Results", "orig": "Qualitative Results", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, "text": "5.3 Qualitative Results" }, { "label": "text", "id": 1, "page_no": 9, "cluster": { "id": 1, "label": "text", "bbox": { "l": 134.8, "t": 309.9, "r": 480.6, "b": 366.5, "coord_origin": "TOPLEFT" }, "confidence": 0.98, "cells": [ { "index": 57, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 134.8, "r_y0": 318.7, "r_x1": 480.6, "r_y1": 318.7, "r_x2": 480.6, "r_y2": 309.9, "r_x3": 134.8, "r_y3": 309.9, "coord_origin": "TOPLEFT" }, "text": "To illustrate the qualitative differences between OTSL and HTML, Figure 5", "orig": "To illustrate the qualitative differences between OTSL and HTML, Figure 5", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 58, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 134.8, "r_y0": 330.6, "r_x1": 480.6, "r_y1": 330.6, "r_x2": 480.6, "r_y2": 321.8, "r_x3": 134.8, "r_y3": 321.8, "coord_origin": "TOPLEFT" }, "text": "demonstrates less overlap and more accurate bounding boxes with OTSL. In", "orig": "demonstrates less overlap and more accurate bounding boxes with OTSL. In", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 59, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 134.8, "r_y0": 342.6, "r_x1": 480.6, "r_y1": 342.6, "r_x2": 480.6, "r_y2": 333.8, "r_x3": 134.8, "r_y3": 333.8, "coord_origin": "TOPLEFT" }, "text": "Figure 6, OTSL proves to be more effective in handling tables with longer to-", "orig": "Figure 6, OTSL proves to be more effective in handling tables with longer to-", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 60, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 134.8, "r_y0": 354.5, "r_x1": 480.6, "r_y1": 354.5, "r_x2": 480.6, "r_y2": 345.7, "r_x3": 134.8, "r_y3": 345.7, "coord_origin": "TOPLEFT" }, "text": "ken sequences, resulting in even more precise structure prediction and bounding", "orig": "ken sequences, resulting in even more precise structure prediction and bounding", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 61, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 134.8, "r_y0": 366.5, "r_x1": 161.7, "r_y1": 366.5, "r_x2": 161.7, "r_y2": 357.7, "r_x3": 134.8, "r_y3": 357.7, "coord_origin": "TOPLEFT" }, "text": "boxes.", "orig": "boxes.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, "text": "To illustrate the qualitative differences between OTSL and HTML, Figure 5 demonstrates less overlap and more accurate bounding boxes with OTSL. In Figure 6, OTSL proves to be more effective in handling tables with longer token sequences, resulting in even more precise structure prediction and bounding boxes." }, { "label": "caption", "id": 5, "page_no": 9, "cluster": { "id": 5, "label": "caption", "bbox": { "l": 134.8, "t": 397.6, "r": 480.6, "b": 439.7, "coord_origin": "TOPLEFT" }, "confidence": 0.95, "cells": [ { "index": 62, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 134.8, "r_y0": 405.5, "r_x1": 162.6, "r_y1": 405.5, "r_x2": 162.6, "r_y2": 397.6, "r_x3": 134.8, "r_y3": 397.6, "coord_origin": "TOPLEFT" }, "text": "Fig. 5.", "orig": "Fig. 5.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 63, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 167.4, "r_y0": 405.7, "r_x1": 480.6, "r_y1": 405.7, "r_x2": 480.6, "r_y2": 397.7, "r_x3": 167.4, "r_y3": 397.7, "coord_origin": "TOPLEFT" }, "text": "The OTSL model produces more accurate bounding boxes with less over-", "orig": "The OTSL model produces more accurate bounding boxes with less over-", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 64, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 134.8, "r_y0": 416.7, "r_x1": 480.6, "r_y1": 416.7, "r_x2": 480.6, "r_y2": 408.6, "r_x3": 134.8, "r_y3": 408.6, "coord_origin": "TOPLEFT" }, "text": "lap (E) than the HTML model (D), when predicting the structure of a sparse ta-", "orig": "lap (E) than the HTML model (D), when predicting the structure of a sparse ta-", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 65, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 134.8, "r_y0": 427.6, "r_x1": 480.6, "r_y1": 427.6, "r_x2": 480.6, "r_y2": 419.6, "r_x3": 134.8, "r_y3": 419.6, "coord_origin": "TOPLEFT" }, "text": "ble (A), at twice the inference speed because of shorter sequence length (B),(C).", "orig": "ble (A), at twice the inference speed because of shorter sequence length (B),(C).", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 66, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 134.8, "r_y0": 438.6, "r_x1": 304.7, "r_y1": 438.6, "r_x2": 304.7, "r_y2": 430.5, "r_x3": 134.8, "r_y3": 430.5, "coord_origin": "TOPLEFT" }, "text": "\"PMC2807444_006_00.png\" PubTabNet.", "orig": "\"PMC2807444_006_00.png\" PubTabNet.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 118, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 342.6, "r_y0": 439.7, "r_x1": 344.8, "r_y1": 439.7, "r_x2": 344.8, "r_y2": 430.2, "r_x3": 342.6, "r_y3": 430.2, "coord_origin": "TOPLEFT" }, "text": "\u03bc", "orig": "\u03bc", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, "text": "Fig. 5. The OTSL model produces more accurate bounding boxes with less overlap (E) than the HTML model (D), when predicting the structure of a sparse table (A), at twice the inference speed because of shorter sequence length (B),(C). \"PMC2807444_006_00.png\" PubTabNet. \u03bc" }, { "label": "picture", "id": 2, "page_no": 9, "cluster": { "id": 2, "label": "picture", "bbox": { "l": 162.7, "t": 444.6, "r": 451.7, "b": 663.2, "coord_origin": "TOPLEFT" }, "confidence": 0.97, "cells": [ { "index": 67, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 180.1, "r_y0": 518.9, "r_x1": 190.6, "r_y1": 518.9, "r_x2": 190.6, "r_y2": 516.2, "r_x3": 180.1, "r_y3": 516.2, "coord_origin": "TOPLEFT" }, "text": "", "orig": "
", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 68, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 183.2, "r_y0": 522.8, "r_x1": 304.5, "r_y1": 522.8, "r_x2": 304.5, "r_y2": 520.1, "r_x3": 183.2, "r_y3": 520.1, "coord_origin": "TOPLEFT" }, "text": "", "orig": "", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 69, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 183.2, "r_y0": 526.7, "r_x1": 388.4, "r_y1": 526.7, "r_x2": 388.4, "r_y2": 524.0, "r_x3": 183.2, "r_y3": 524.0, "coord_origin": "TOPLEFT" }, "text": "", "orig": "", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 70, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 183.2, "r_y0": 530.6, "r_x1": 388.4, "r_y1": 530.6, "r_x2": 388.4, "r_y2": 527.9, "r_x3": 183.2, "r_y3": 527.9, "coord_origin": "TOPLEFT" }, "text": "", "orig": "", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 71, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 183.2, "r_y0": 534.5, "r_x1": 388.4, "r_y1": 534.5, "r_x2": 388.4, "r_y2": 531.8, "r_x3": 183.2, "r_y3": 531.8, "coord_origin": "TOPLEFT" }, "text": "", "orig": "", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 72, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 183.2, "r_y0": 538.4, "r_x1": 388.4, "r_y1": 538.4, "r_x2": 388.4, "r_y2": 535.7, "r_x3": 183.2, "r_y3": 535.7, "coord_origin": "TOPLEFT" }, "text": "", "orig": "", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 73, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 183.2, "r_y0": 542.3, "r_x1": 388.4, "r_y1": 542.3, "r_x2": 388.4, "r_y2": 539.6, "r_x3": 183.2, "r_y3": 539.6, "coord_origin": "TOPLEFT" }, "text": "", "orig": "", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 74, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 183.2, "r_y0": 546.2, "r_x1": 388.4, "r_y1": 546.2, "r_x2": 388.4, "r_y2": 543.5, "r_x3": 183.2, "r_y3": 543.5, "coord_origin": "TOPLEFT" }, "text": "", "orig": "", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 75, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 183.2, "r_y0": 550.1, "r_x1": 388.4, "r_y1": 550.1, "r_x2": 388.4, "r_y2": 547.4, "r_x3": 183.2, "r_y3": 547.4, "coord_origin": "TOPLEFT" }, "text": "", "orig": "", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 76, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 183.2, "r_y0": 554.0, "r_x1": 388.4, "r_y1": 554.0, "r_x2": 388.4, "r_y2": 551.3, "r_x3": 183.2, "r_y3": 551.3, "coord_origin": "TOPLEFT" }, "text": "", "orig": "", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 77, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 180.1, "r_y0": 557.9, "r_x1": 191.9, "r_y1": 557.9, "r_x2": 191.9, "r_y2": 555.2, "r_x3": 180.1, "r_y3": 555.2, "coord_origin": "TOPLEFT" }, "text": "
", "orig": "", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 78, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 407.4, "r_y0": 521.0, "r_x1": 408.8, "r_y1": 521.0, "r_x2": 408.8, "r_y2": 518.3, "r_x3": 407.4, "r_y3": 518.3, "coord_origin": "TOPLEFT" }, "text": "C", "orig": "C", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 79, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 410.3, "r_y0": 521.0, "r_x1": 450.5, "r_y1": 521.0, "r_x2": 450.5, "r_y2": 518.3, "r_x3": 410.3, "r_y3": 518.3, "coord_origin": "TOPLEFT" }, "text": "C L L L C L L L L L C L L NL", "orig": "C L L L C L L L L L C L L NL", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 80, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 407.4, "r_y0": 524.9, "r_x1": 408.8, "r_y1": 524.9, "r_x2": 408.8, "r_y2": 522.2, "r_x3": 407.4, "r_y3": 522.2, "coord_origin": "TOPLEFT" }, "text": "C", "orig": "C", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 81, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 410.3, "r_y0": 524.9, "r_x1": 450.5, "r_y1": 524.9, "r_x2": 450.5, "r_y2": 522.2, "r_x3": 410.3, "r_y3": 522.2, "coord_origin": "TOPLEFT" }, "text": "C C C C C C C C C C C C C NL", "orig": "C C C C C C C C C C C C C NL", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 82, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 407.4, "r_y0": 528.8, "r_x1": 408.8, "r_y1": 528.8, "r_x2": 408.8, "r_y2": 526.1, "r_x3": 407.4, "r_y3": 526.1, "coord_origin": "TOPLEFT" }, "text": "C", "orig": "C", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 83, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 410.3, "r_y0": 528.8, "r_x1": 450.5, "r_y1": 528.8, "r_x2": 450.5, "r_y2": 526.1, "r_x3": 410.3, "r_y3": 526.1, "coord_origin": "TOPLEFT" }, "text": "C C C C C C C C C C C C C NL", "orig": "C C C C C C C C C C C C C NL", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 84, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 407.4, "r_y0": 532.7, "r_x1": 408.8, "r_y1": 532.7, "r_x2": 408.8, "r_y2": 530.0, "r_x3": 407.4, "r_y3": 530.0, "coord_origin": "TOPLEFT" }, "text": "C", "orig": "C", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 85, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 410.3, "r_y0": 532.7, "r_x1": 450.5, "r_y1": 532.7, "r_x2": 450.5, "r_y2": 530.0, "r_x3": 410.3, "r_y3": 530.0, "coord_origin": "TOPLEFT" }, "text": "C C C C C C C C C C C C C NL", "orig": "C C C C C C C C C C C C C NL", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 86, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 407.4, "r_y0": 536.6, "r_x1": 408.8, "r_y1": 536.6, "r_x2": 408.8, "r_y2": 533.9, "r_x3": 407.4, "r_y3": 533.9, "coord_origin": "TOPLEFT" }, "text": "C", "orig": "C", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 87, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 410.3, "r_y0": 536.6, "r_x1": 450.5, "r_y1": 536.6, "r_x2": 450.5, "r_y2": 533.9, "r_x3": 410.3, "r_y3": 533.9, "coord_origin": "TOPLEFT" }, "text": "C C C C C C C C C C C C C NL", "orig": "C C C C C C C C C C C C C NL", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 88, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 407.4, "r_y0": 540.5, "r_x1": 408.8, "r_y1": 540.5, "r_x2": 408.8, "r_y2": 537.8, "r_x3": 407.4, "r_y3": 537.8, "coord_origin": "TOPLEFT" }, "text": "C", "orig": "C", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 89, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 410.3, "r_y0": 540.5, "r_x1": 450.5, "r_y1": 540.5, "r_x2": 450.5, "r_y2": 537.8, "r_x3": 410.3, "r_y3": 537.8, "coord_origin": "TOPLEFT" }, "text": "C C C C C C C C C C C C C NL", "orig": "C C C C C C C C C C C C C NL", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 90, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 407.4, "r_y0": 544.4, "r_x1": 408.8, "r_y1": 544.4, "r_x2": 408.8, "r_y2": 541.7, "r_x3": 407.4, "r_y3": 541.7, "coord_origin": "TOPLEFT" }, "text": "C", "orig": "C", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 91, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 410.3, "r_y0": 544.4, "r_x1": 450.5, "r_y1": 544.4, "r_x2": 450.5, "r_y2": 541.7, "r_x3": 410.3, "r_y3": 541.7, "coord_origin": "TOPLEFT" }, "text": "C C C C C C C C C C C C C NL", "orig": "C C C C C C C C C C C C C NL", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 92, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 407.4, "r_y0": 548.3, "r_x1": 408.8, "r_y1": 548.3, "r_x2": 408.8, "r_y2": 545.6, "r_x3": 407.4, "r_y3": 545.6, "coord_origin": "TOPLEFT" }, "text": "C", "orig": "C", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 93, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 410.3, "r_y0": 548.3, "r_x1": 450.5, "r_y1": 548.3, "r_x2": 450.5, "r_y2": 545.6, "r_x3": 410.3, "r_y3": 545.6, "coord_origin": "TOPLEFT" }, "text": "C C C C C C C C C C C C C NL", "orig": "C C C C C C C C C C C C C NL", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 94, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 407.4, "r_y0": 552.2, "r_x1": 408.8, "r_y1": 552.2, "r_x2": 408.8, "r_y2": 549.5, "r_x3": 407.4, "r_y3": 549.5, "coord_origin": "TOPLEFT" }, "text": "C", "orig": "C", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 95, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 410.3, "r_y0": 552.2, "r_x1": 450.5, "r_y1": 552.2, "r_x2": 450.5, "r_y2": 549.5, "r_x3": 410.3, "r_y3": 549.5, "coord_origin": "TOPLEFT" }, "text": "C C C C C C C C C C C C C NL", "orig": "C C C C C C C C C C C C C NL", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 96, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 164.5, "r_y0": 515.3, "r_x1": 181.9, "r_y1": 515.3, "r_x2": 181.9, "r_y2": 509.5, "r_x3": 164.5, "r_y3": 509.5, "coord_origin": "TOPLEFT" }, "text": "HTML", "orig": "HTML", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 97, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 183.6, "r_y0": 515.3, "r_x1": 186.4, "r_y1": 515.3, "r_x2": 186.4, "r_y2": 509.5, "r_x3": 183.6, "r_y3": 509.5, "coord_origin": "TOPLEFT" }, "text": "#", "orig": "#", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 98, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 189.2, "r_y0": 515.3, "r_x1": 208.9, "r_y1": 515.3, "r_x2": 208.9, "r_y2": 509.5, "r_x3": 189.2, "r_y3": 509.5, "coord_origin": "TOPLEFT" }, "text": "tokens:", "orig": "tokens:", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 99, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 210.6, "r_y0": 515.3, "r_x1": 221.0, "r_y1": 515.3, "r_x2": 221.0, "r_y2": 509.5, "r_x3": 210.6, "r_y3": 509.5, "coord_origin": "TOPLEFT" }, "text": "258", "orig": "258", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 100, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 390.2, "r_y0": 515.5, "r_x1": 406.8, "r_y1": 515.5, "r_x2": 406.8, "r_y2": 509.6, "r_x3": 390.2, "r_y3": 509.6, "coord_origin": "TOPLEFT" }, "text": "OTSL", "orig": "OTSL", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 101, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 408.6, "r_y0": 515.5, "r_x1": 411.4, "r_y1": 515.5, "r_x2": 411.4, "r_y2": 509.6, "r_x3": 408.6, "r_y3": 509.6, "coord_origin": "TOPLEFT" }, "text": "#", "orig": "#", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 102, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 414.2, "r_y0": 515.5, "r_x1": 433.9, "r_y1": 515.5, "r_x2": 433.9, "r_y2": 509.6, "r_x3": 414.2, "r_y3": 509.6, "coord_origin": "TOPLEFT" }, "text": "tokens:", "orig": "tokens:", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 103, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 435.6, "r_y0": 515.5, "r_x1": 446.0, "r_y1": 515.5, "r_x2": 446.0, "r_y2": 509.6, "r_x3": 435.6, "r_y3": 509.6, "coord_origin": "TOPLEFT" }, "text": "135", "orig": "135", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 104, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 167.2, "r_y0": 526.4, "r_x1": 172.8, "r_y1": 526.4, "r_x2": 172.8, "r_y2": 519.1, "r_x3": 167.2, "r_y3": 519.1, "coord_origin": "TOPLEFT" }, "text": "B", "orig": "B", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 105, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 187.3, "r_y0": 455.9, "r_x1": 193.0, "r_y1": 455.9, "r_x2": 193.0, "r_y2": 448.6, "r_x3": 187.3, "r_y3": 448.6, "coord_origin": "TOPLEFT" }, "text": "A", "orig": "A", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 106, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 167.4, "r_y0": 573.3, "r_x1": 173.0, "r_y1": 573.3, "r_x2": 173.0, "r_y2": 566.0, "r_x3": 167.4, "r_y3": 566.0, "coord_origin": "TOPLEFT" }, "text": "D", "orig": "D", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 107, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 248.5, "r_y0": 629.1, "r_x1": 253.7, "r_y1": 629.1, "r_x2": 253.7, "r_y2": 621.8, "r_x3": 248.5, "r_y3": 621.8, "coord_origin": "TOPLEFT" }, "text": "E", "orig": "E", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 108, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 395.9, "r_y0": 526.5, "r_x1": 401.5, "r_y1": 526.5, "r_x2": 401.5, "r_y2": 519.2, "r_x3": 395.9, "r_y3": 519.2, "coord_origin": "TOPLEFT" }, "text": "C", "orig": "C", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 109, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 171.6, "r_y0": 597.3, "r_x1": 177.5, "r_y1": 597.3, "r_x2": 177.5, "r_y2": 580.3, "r_x3": 171.6, "r_y3": 580.3, "coord_origin": "TOPLEFT" }, "text": "HTML", "orig": "HTML", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 110, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 251.1, "r_y0": 649.9, "r_x1": 256.9, "r_y1": 649.9, "r_x2": 256.9, "r_y2": 633.6, "r_x3": 251.1, "r_y3": 633.6, "coord_origin": "TOPLEFT" }, "text": "OTSL", "orig": "OTSL", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 111, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 372.1, "r_y0": 607.3, "r_x1": 427.0, "r_y1": 607.3, "r_x2": 427.0, "r_y2": 601.5, "r_x3": 372.1, "r_y3": 601.5, "coord_origin": "TOPLEFT" }, "text": "HTML model shows", "orig": "HTML model shows", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 112, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 372.1, "r_y0": 613.8, "r_x1": 430.1, "r_y1": 613.8, "r_x2": 430.1, "r_y2": 607.9, "r_x3": 372.1, "r_y3": 607.9, "coord_origin": "TOPLEFT" }, "text": "bounding box drifting", "orig": "bounding box drifting", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 113, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 176.9, "r_y0": 648.7, "r_x1": 231.1, "r_y1": 648.7, "r_x2": 231.1, "r_y2": 642.9, "r_x3": 176.9, "r_y3": 642.9, "coord_origin": "TOPLEFT" }, "text": "OTSL model shows", "orig": "OTSL model shows", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 114, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 176.9, "r_y0": 655.2, "r_x1": 231.0, "r_y1": 655.2, "r_x2": 231.0, "r_y2": 649.3, "r_x3": 176.9, "r_y3": 649.3, "coord_origin": "TOPLEFT" }, "text": "clean bounding box", "orig": "clean bounding box", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 115, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 176.9, "r_y0": 661.6, "r_x1": 203.9, "r_y1": 661.6, "r_x2": 203.9, "r_y2": 655.8, "r_x3": 176.9, "r_y3": 655.8, "coord_origin": "TOPLEFT" }, "text": "alignment", "orig": "alignment", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 116, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 215.9, "r_y0": 569.2, "r_x1": 218.5, "r_y1": 569.2, "r_x2": 218.5, "r_y2": 557.6, "r_x3": 215.9, "r_y3": 557.6, "coord_origin": "TOPLEFT" }, "text": "\u2264", "orig": "\u2264", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 117, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 229.1, "r_y0": 569.2, "r_x1": 231.7, "r_y1": 569.2, "r_x2": 231.7, "r_y2": 557.6, "r_x3": 229.1, "r_y3": 557.6, "coord_origin": "TOPLEFT" }, "text": "\u03bc", "orig": "\u03bc", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 119, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 261.2, "r_y0": 451.2, "r_x1": 263.6, "r_y1": 451.2, "r_x2": 263.6, "r_y2": 448.5, "r_x3": 261.2, "r_y3": 448.5, "coord_origin": "TOPLEFT" }, "text": "S", "orig": "S", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 120, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 312.3, "r_y0": 451.2, "r_x1": 313.6, "r_y1": 451.2, "r_x2": 313.6, "r_y2": 448.5, "r_x3": 312.3, "r_y3": 448.5, "coord_origin": "TOPLEFT" }, "text": "I", "orig": "I", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 121, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 377.4, "r_y0": 451.2, "r_x1": 380.1, "r_y1": 451.2, "r_x2": 380.1, "r_y2": 448.5, "r_x3": 377.4, "r_y3": 448.5, "coord_origin": "TOPLEFT" }, "text": "R", "orig": "R", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 122, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 200.6, "r_y0": 456.1, "r_x1": 205.8, "r_y1": 456.1, "r_x2": 205.8, "r_y2": 453.3, "r_x3": 200.6, "r_y3": 453.3, "coord_origin": "TOPLEFT" }, "text": "ST", "orig": "ST", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 123, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 222.2, "r_y0": 456.1, "r_x1": 229.8, "r_y1": 456.1, "r_x2": 229.8, "r_y2": 453.3, "r_x3": 222.2, "r_y3": 453.3, "coord_origin": "TOPLEFT" }, "text": "0.03", "orig": "0.03", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 124, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 243.3, "r_y0": 456.1, "r_x1": 250.8, "r_y1": 456.1, "r_x2": 250.8, "r_y2": 453.3, "r_x3": 243.3, "r_y3": 453.3, "coord_origin": "TOPLEFT" }, "text": "0.06", "orig": "0.06", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 125, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 264.3, "r_y0": 456.1, "r_x1": 271.8, "r_y1": 456.1, "r_x2": 271.8, "r_y2": 453.3, "r_x3": 264.3, "r_y3": 453.3, "coord_origin": "TOPLEFT" }, "text": "0.12", "orig": "0.12", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 126, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 285.3, "r_y0": 456.1, "r_x1": 292.9, "r_y1": 456.1, "r_x2": 292.9, "r_y2": 453.3, "r_x3": 285.3, "r_y3": 453.3, "coord_origin": "TOPLEFT" }, "text": "0.25", "orig": "0.25", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 127, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 306.4, "r_y0": 456.1, "r_x1": 311.8, "r_y1": 456.1, "r_x2": 311.8, "r_y2": 453.3, "r_x3": 306.4, "r_y3": 453.3, "coord_origin": "TOPLEFT" }, "text": "0.5", "orig": "0.5", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 128, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 323.4, "r_y0": 456.1, "r_x1": 325.6, "r_y1": 456.1, "r_x2": 325.6, "r_y2": 453.3, "r_x3": 323.4, "r_y3": 453.3, "coord_origin": "TOPLEFT" }, "text": "1", "orig": "1", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 129, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 334.5, "r_y0": 456.1, "r_x1": 336.6, "r_y1": 456.1, "r_x2": 336.6, "r_y2": 453.3, "r_x3": 334.5, "r_y3": 453.3, "coord_origin": "TOPLEFT" }, "text": "2", "orig": "2", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 130, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 345.5, "r_y0": 456.1, "r_x1": 347.7, "r_y1": 456.1, "r_x2": 347.7, "r_y2": 453.3, "r_x3": 345.5, "r_y3": 453.3, "coord_origin": "TOPLEFT" }, "text": "4", "orig": "4", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 131, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 356.6, "r_y0": 456.1, "r_x1": 358.7, "r_y1": 456.1, "r_x2": 358.7, "r_y2": 453.3, "r_x3": 356.6, "r_y3": 453.3, "coord_origin": "TOPLEFT" }, "text": "8", "orig": "8", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 132, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 367.6, "r_y0": 456.1, "r_x1": 372.0, "r_y1": 456.1, "r_x2": 372.0, "r_y2": 453.3, "r_x3": 367.6, "r_y3": 453.3, "coord_origin": "TOPLEFT" }, "text": "16", "orig": "16", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 133, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 382.7, "r_y0": 456.1, "r_x1": 387.0, "r_y1": 456.1, "r_x2": 387.0, "r_y2": 453.3, "r_x3": 382.7, "r_y3": 453.3, "coord_origin": "TOPLEFT" }, "text": "32", "orig": "32", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 134, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 397.7, "r_y0": 456.1, "r_x1": 402.1, "r_y1": 456.1, "r_x2": 402.1, "r_y2": 453.3, "r_x3": 397.7, "r_y3": 453.3, "coord_origin": "TOPLEFT" }, "text": "64", "orig": "64", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 135, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 412.8, "r_y0": 457.8, "r_x1": 414.9, "r_y1": 457.8, "r_x2": 414.9, "r_y2": 448.0, "r_x3": 412.8, "r_y3": 448.0, "coord_origin": "TOPLEFT" }, "text": "\u2265", "orig": "\u2265", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 136, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 415.0, "r_y0": 456.1, "r_x1": 422.5, "r_y1": 456.1, "r_x2": 422.5, "r_y2": 453.3, "r_x3": 415.0, "r_y3": 453.3, "coord_origin": "TOPLEFT" }, "text": " 128", "orig": " 128", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 137, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 200.6, "r_y0": 466.7, "r_x1": 204.6, "r_y1": 466.7, "r_x2": 204.6, "r_y2": 463.9, "r_x3": 200.6, "r_y3": 463.9, "coord_origin": "TOPLEFT" }, "text": "63", "orig": "63", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 138, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 367.6, "r_y0": 466.7, "r_x1": 369.6, "r_y1": 466.7, "r_x2": 369.6, "r_y2": 463.9, "r_x3": 367.6, "r_y3": 463.9, "coord_origin": "TOPLEFT" }, "text": "1", "orig": "1", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 139, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 382.7, "r_y0": 466.7, "r_x1": 384.6, "r_y1": 466.7, "r_x2": 384.6, "r_y2": 463.9, "r_x3": 382.7, "r_y3": 463.9, "coord_origin": "TOPLEFT" }, "text": "1", "orig": "1", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 140, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 397.7, "r_y0": 466.7, "r_x1": 399.7, "r_y1": 466.7, "r_x2": 399.7, "r_y2": 463.9, "r_x3": 397.7, "r_y3": 463.9, "coord_origin": "TOPLEFT" }, "text": "3", "orig": "3", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 141, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 200.6, "r_y0": 471.5, "r_x1": 206.5, "r_y1": 471.5, "r_x2": 206.5, "r_y2": 468.8, "r_x3": 200.6, "r_y3": 468.8, "coord_origin": "TOPLEFT" }, "text": "199", "orig": "199", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 142, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 264.3, "r_y0": 471.5, "r_x1": 266.3, "r_y1": 471.5, "r_x2": 266.3, "r_y2": 468.8, "r_x3": 264.3, "r_y3": 468.8, "coord_origin": "TOPLEFT" }, "text": "5", "orig": "5", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 143, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 306.4, "r_y0": 471.5, "r_x1": 308.3, "r_y1": 471.5, "r_x2": 308.3, "r_y2": 468.8, "r_x3": 306.4, "r_y3": 468.8, "coord_origin": "TOPLEFT" }, "text": "1", "orig": "1", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 144, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 345.5, "r_y0": 471.5, "r_x1": 347.5, "r_y1": 471.5, "r_x2": 347.5, "r_y2": 468.8, "r_x3": 345.5, "r_y3": 468.8, "coord_origin": "TOPLEFT" }, "text": "2", "orig": "2", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 145, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 356.6, "r_y0": 471.5, "r_x1": 358.5, "r_y1": 471.5, "r_x2": 358.5, "r_y2": 468.8, "r_x3": 356.6, "r_y3": 468.8, "coord_origin": "TOPLEFT" }, "text": "4", "orig": "4", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 146, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 367.6, "r_y0": 471.5, "r_x1": 369.6, "r_y1": 471.5, "r_x2": 369.6, "r_y2": 468.8, "r_x3": 367.6, "r_y3": 468.8, "coord_origin": "TOPLEFT" }, "text": "1", "orig": "1", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 147, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 382.7, "r_y0": 471.5, "r_x1": 384.6, "r_y1": 471.5, "r_x2": 384.6, "r_y2": 468.8, "r_x3": 382.7, "r_y3": 468.8, "coord_origin": "TOPLEFT" }, "text": "1", "orig": "1", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 148, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 200.6, "r_y0": 476.4, "r_x1": 206.5, "r_y1": 476.4, "r_x2": 206.5, "r_y2": 473.7, "r_x3": 200.6, "r_y3": 473.7, "coord_origin": "TOPLEFT" }, "text": "416", "orig": "416", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 149, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 264.3, "r_y0": 476.4, "r_x1": 266.3, "r_y1": 476.4, "r_x2": 266.3, "r_y2": 473.7, "r_x3": 264.3, "r_y3": 473.7, "coord_origin": "TOPLEFT" }, "text": "4", "orig": "4", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 150, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 200.6, "r_y0": 481.3, "r_x1": 206.5, "r_y1": 481.3, "r_x2": 206.5, "r_y2": 478.5, "r_x3": 200.6, "r_y3": 478.5, "coord_origin": "TOPLEFT" }, "text": "230", "orig": "230", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 151, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 243.3, "r_y0": 481.3, "r_x1": 245.2, "r_y1": 481.3, "r_x2": 245.2, "r_y2": 478.5, "r_x3": 243.3, "r_y3": 478.5, "coord_origin": "TOPLEFT" }, "text": "1", "orig": "1", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 152, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 264.3, "r_y0": 481.3, "r_x1": 266.3, "r_y1": 481.3, "r_x2": 266.3, "r_y2": 478.5, "r_x3": 264.3, "r_y3": 478.5, "coord_origin": "TOPLEFT" }, "text": "9", "orig": "9", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 153, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 323.4, "r_y0": 481.3, "r_x1": 325.4, "r_y1": 481.3, "r_x2": 325.4, "r_y2": 478.5, "r_x3": 323.4, "r_y3": 478.5, "coord_origin": "TOPLEFT" }, "text": "1", "orig": "1", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 154, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 397.7, "r_y0": 481.3, "r_x1": 399.7, "r_y1": 481.3, "r_x2": 399.7, "r_y2": 478.5, "r_x3": 397.7, "r_y3": 478.5, "coord_origin": "TOPLEFT" }, "text": "1", "orig": "1", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 155, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 200.6, "r_y0": 486.1, "r_x1": 206.5, "r_y1": 486.1, "r_x2": 206.5, "r_y2": 483.4, "r_x3": 200.6, "r_y3": 483.4, "coord_origin": "TOPLEFT" }, "text": "276", "orig": "276", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 156, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 382.7, "r_y0": 486.1, "r_x1": 384.6, "r_y1": 486.1, "r_x2": 384.6, "r_y2": 483.4, "r_x3": 382.7, "r_y3": 483.4, "coord_origin": "TOPLEFT" }, "text": "2", "orig": "2", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 157, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 397.7, "r_y0": 486.1, "r_x1": 401.6, "r_y1": 486.1, "r_x2": 401.6, "r_y2": 483.4, "r_x3": 397.7, "r_y3": 483.4, "coord_origin": "TOPLEFT" }, "text": "12", "orig": "12", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 158, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 412.8, "r_y0": 486.1, "r_x1": 414.7, "r_y1": 486.1, "r_x2": 414.7, "r_y2": 483.4, "r_x3": 412.8, "r_y3": 483.4, "coord_origin": "TOPLEFT" }, "text": "1", "orig": "1", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 159, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 200.6, "r_y0": 491.0, "r_x1": 207.1, "r_y1": 491.0, "r_x2": 207.1, "r_y2": 488.3, "r_x3": 200.6, "r_y3": 488.3, "coord_origin": "TOPLEFT" }, "text": "320", "orig": "320", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 160, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 367.6, "r_y0": 491.0, "r_x1": 369.8, "r_y1": 491.0, "r_x2": 369.8, "r_y2": 488.3, "r_x3": 367.6, "r_y3": 488.3, "coord_origin": "TOPLEFT" }, "text": "1", "orig": "1", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 161, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 382.7, "r_y0": 491.0, "r_x1": 384.8, "r_y1": 491.0, "r_x2": 384.8, "r_y2": 488.3, "r_x3": 382.7, "r_y3": 488.3, "coord_origin": "TOPLEFT" }, "text": "4", "orig": "4", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 162, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 397.7, "r_y0": 491.0, "r_x1": 402.1, "r_y1": 491.0, "r_x2": 402.1, "r_y2": 488.3, "r_x3": 397.7, "r_y3": 488.3, "coord_origin": "TOPLEFT" }, "text": "20", "orig": "20", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 163, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 200.6, "r_y0": 495.9, "r_x1": 208.5, "r_y1": 495.9, "r_x2": 208.5, "r_y2": 493.2, "r_x3": 200.6, "r_y3": 493.2, "coord_origin": "TOPLEFT" }, "text": "2013", "orig": "2013", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 164, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 264.3, "r_y0": 495.9, "r_x1": 266.3, "r_y1": 495.9, "r_x2": 266.3, "r_y2": 493.2, "r_x3": 264.3, "r_y3": 493.2, "coord_origin": "TOPLEFT" }, "text": "3", "orig": "3", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [ { "id": 58, "label": "text", "bbox": { "l": 180.1, "t": 516.2, "r": 190.6, "b": 518.9, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 67, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 180.1, "r_y0": 518.9, "r_x1": 190.6, "r_y1": 518.9, "r_x2": 190.6, "r_y2": 516.2, "r_x3": 180.1, "r_y3": 516.2, "coord_origin": "TOPLEFT" }, "text": "", "orig": "
", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 59, "label": "text", "bbox": { "l": 183.2, "t": 520.1, "r": 304.5, "b": 522.8, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 68, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 183.2, "r_y0": 522.8, "r_x1": 304.5, "r_y1": 522.8, "r_x2": 304.5, "r_y2": 520.1, "r_x3": 183.2, "r_y3": 520.1, "coord_origin": "TOPLEFT" }, "text": "", "orig": "", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 60, "label": "text", "bbox": { "l": 183.2, "t": 524.0, "r": 388.4, "b": 526.7, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 69, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 183.2, "r_y0": 526.7, "r_x1": 388.4, "r_y1": 526.7, "r_x2": 388.4, "r_y2": 524.0, "r_x3": 183.2, "r_y3": 524.0, "coord_origin": "TOPLEFT" }, "text": "", "orig": "", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 61, "label": "text", "bbox": { "l": 183.2, "t": 527.9, "r": 388.4, "b": 530.6, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 70, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 183.2, "r_y0": 530.6, "r_x1": 388.4, "r_y1": 530.6, "r_x2": 388.4, "r_y2": 527.9, "r_x3": 183.2, "r_y3": 527.9, "coord_origin": "TOPLEFT" }, "text": "", "orig": "", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 62, "label": "text", "bbox": { "l": 183.2, "t": 531.8, "r": 388.4, "b": 534.5, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 71, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 183.2, "r_y0": 534.5, "r_x1": 388.4, "r_y1": 534.5, "r_x2": 388.4, "r_y2": 531.8, "r_x3": 183.2, "r_y3": 531.8, "coord_origin": "TOPLEFT" }, "text": "", "orig": "", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 63, "label": "text", "bbox": { "l": 183.2, "t": 535.7, "r": 388.4, "b": 538.4, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 72, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 183.2, "r_y0": 538.4, "r_x1": 388.4, "r_y1": 538.4, "r_x2": 388.4, "r_y2": 535.7, "r_x3": 183.2, "r_y3": 535.7, "coord_origin": "TOPLEFT" }, "text": "", "orig": "", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 64, "label": "text", "bbox": { "l": 183.2, "t": 539.6, "r": 388.4, "b": 542.3, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 73, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 183.2, "r_y0": 542.3, "r_x1": 388.4, "r_y1": 542.3, "r_x2": 388.4, "r_y2": 539.6, "r_x3": 183.2, "r_y3": 539.6, "coord_origin": "TOPLEFT" }, "text": "", "orig": "", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 65, "label": "text", "bbox": { "l": 183.2, "t": 543.5, "r": 388.4, "b": 546.2, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 74, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 183.2, "r_y0": 546.2, "r_x1": 388.4, "r_y1": 546.2, "r_x2": 388.4, "r_y2": 543.5, "r_x3": 183.2, "r_y3": 543.5, "coord_origin": "TOPLEFT" }, "text": "", "orig": "", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 66, "label": "text", "bbox": { "l": 183.2, "t": 547.4, "r": 388.4, "b": 550.1, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 75, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 183.2, "r_y0": 550.1, "r_x1": 388.4, "r_y1": 550.1, "r_x2": 388.4, "r_y2": 547.4, "r_x3": 183.2, "r_y3": 547.4, "coord_origin": "TOPLEFT" }, "text": "", "orig": "", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 67, "label": "text", "bbox": { "l": 183.2, "t": 551.3, "r": 388.4, "b": 554.0, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 76, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 183.2, "r_y0": 554.0, "r_x1": 388.4, "r_y1": 554.0, "r_x2": 388.4, "r_y2": 551.3, "r_x3": 183.2, "r_y3": 551.3, "coord_origin": "TOPLEFT" }, "text": "", "orig": "", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 68, "label": "text", "bbox": { "l": 180.1, "t": 555.2, "r": 191.9, "b": 557.9, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 77, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 180.1, "r_y0": 557.9, "r_x1": 191.9, "r_y1": 557.9, "r_x2": 191.9, "r_y2": 555.2, "r_x3": 180.1, "r_y3": 555.2, "coord_origin": "TOPLEFT" }, "text": "
", "orig": "", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 69, "label": "text", "bbox": { "l": 407.4, "t": 518.3, "r": 408.8, "b": 521.0, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 78, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 407.4, "r_y0": 521.0, "r_x1": 408.8, "r_y1": 521.0, "r_x2": 408.8, "r_y2": 518.3, "r_x3": 407.4, "r_y3": 518.3, "coord_origin": "TOPLEFT" }, "text": "C", "orig": "C", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 70, "label": "text", "bbox": { "l": 410.3, "t": 518.3, "r": 450.5, "b": 521.0, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 79, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 410.3, "r_y0": 521.0, "r_x1": 450.5, "r_y1": 521.0, "r_x2": 450.5, "r_y2": 518.3, "r_x3": 410.3, "r_y3": 518.3, "coord_origin": "TOPLEFT" }, "text": "C L L L C L L L L L C L L NL", "orig": "C L L L C L L L L L C L L NL", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 71, "label": "text", "bbox": { "l": 407.4, "t": 522.2, "r": 408.8, "b": 524.9, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 80, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 407.4, "r_y0": 524.9, "r_x1": 408.8, "r_y1": 524.9, "r_x2": 408.8, "r_y2": 522.2, "r_x3": 407.4, "r_y3": 522.2, "coord_origin": "TOPLEFT" }, "text": "C", "orig": "C", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 72, "label": "text", "bbox": { "l": 410.3, "t": 522.2, "r": 450.5, "b": 524.9, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 81, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 410.3, "r_y0": 524.9, "r_x1": 450.5, "r_y1": 524.9, "r_x2": 450.5, "r_y2": 522.2, "r_x3": 410.3, "r_y3": 522.2, "coord_origin": "TOPLEFT" }, "text": "C C C C C C C C C C C C C NL", "orig": "C C C C C C C C C C C C C NL", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 73, "label": "text", "bbox": { "l": 407.4, "t": 526.1, "r": 408.8, "b": 528.8, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 82, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 407.4, "r_y0": 528.8, "r_x1": 408.8, "r_y1": 528.8, "r_x2": 408.8, "r_y2": 526.1, "r_x3": 407.4, "r_y3": 526.1, "coord_origin": "TOPLEFT" }, "text": "C", "orig": "C", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 74, "label": "text", "bbox": { "l": 410.3, "t": 526.1, "r": 450.5, "b": 528.8, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 83, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 410.3, "r_y0": 528.8, "r_x1": 450.5, "r_y1": 528.8, "r_x2": 450.5, "r_y2": 526.1, "r_x3": 410.3, "r_y3": 526.1, "coord_origin": "TOPLEFT" }, "text": "C C C C C C C C C C C C C NL", "orig": "C C C C C C C C C C C C C NL", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 75, "label": "text", "bbox": { "l": 407.4, "t": 530.0, "r": 408.8, "b": 532.7, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 84, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 407.4, "r_y0": 532.7, "r_x1": 408.8, "r_y1": 532.7, "r_x2": 408.8, "r_y2": 530.0, "r_x3": 407.4, "r_y3": 530.0, "coord_origin": "TOPLEFT" }, "text": "C", "orig": "C", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 76, "label": "text", "bbox": { "l": 410.3, "t": 530.0, "r": 450.5, "b": 532.7, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 85, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 410.3, "r_y0": 532.7, "r_x1": 450.5, "r_y1": 532.7, "r_x2": 450.5, "r_y2": 530.0, "r_x3": 410.3, "r_y3": 530.0, "coord_origin": "TOPLEFT" }, "text": "C C C C C C C C C C C C C NL", "orig": "C C C C C C C C C C C C C NL", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 77, "label": "text", "bbox": { "l": 407.4, "t": 533.9, "r": 408.8, "b": 536.6, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 86, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 407.4, "r_y0": 536.6, "r_x1": 408.8, "r_y1": 536.6, "r_x2": 408.8, "r_y2": 533.9, "r_x3": 407.4, "r_y3": 533.9, "coord_origin": "TOPLEFT" }, "text": "C", "orig": "C", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 78, "label": "text", "bbox": { "l": 410.3, "t": 533.9, "r": 450.5, "b": 536.6, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 87, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 410.3, "r_y0": 536.6, "r_x1": 450.5, "r_y1": 536.6, "r_x2": 450.5, "r_y2": 533.9, "r_x3": 410.3, "r_y3": 533.9, "coord_origin": "TOPLEFT" }, "text": "C C C C C C C C C C C C C NL", "orig": "C C C C C C C C C C C C C NL", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 79, "label": "text", "bbox": { "l": 407.4, "t": 537.8, "r": 408.8, "b": 540.5, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 88, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 407.4, "r_y0": 540.5, "r_x1": 408.8, "r_y1": 540.5, "r_x2": 408.8, "r_y2": 537.8, "r_x3": 407.4, "r_y3": 537.8, "coord_origin": "TOPLEFT" }, "text": "C", "orig": "C", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 80, "label": "text", "bbox": { "l": 410.3, "t": 537.8, "r": 450.5, "b": 540.5, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 89, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 410.3, "r_y0": 540.5, "r_x1": 450.5, "r_y1": 540.5, "r_x2": 450.5, "r_y2": 537.8, "r_x3": 410.3, "r_y3": 537.8, "coord_origin": "TOPLEFT" }, "text": "C C C C C C C C C C C C C NL", "orig": "C C C C C C C C C C C C C NL", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 81, "label": "text", "bbox": { "l": 407.4, "t": 541.7, "r": 408.8, "b": 544.4, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 90, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 407.4, "r_y0": 544.4, "r_x1": 408.8, "r_y1": 544.4, "r_x2": 408.8, "r_y2": 541.7, "r_x3": 407.4, "r_y3": 541.7, "coord_origin": "TOPLEFT" }, "text": "C", "orig": "C", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 82, "label": "text", "bbox": { "l": 410.3, "t": 541.7, "r": 450.5, "b": 544.4, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 91, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 410.3, "r_y0": 544.4, "r_x1": 450.5, "r_y1": 544.4, "r_x2": 450.5, "r_y2": 541.7, "r_x3": 410.3, "r_y3": 541.7, "coord_origin": "TOPLEFT" }, "text": "C C C C C C C C C C C C C NL", "orig": "C C C C C C C C C C C C C NL", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 83, "label": "text", "bbox": { "l": 407.4, "t": 545.6, "r": 408.8, "b": 548.3, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 92, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 407.4, "r_y0": 548.3, "r_x1": 408.8, "r_y1": 548.3, "r_x2": 408.8, "r_y2": 545.6, "r_x3": 407.4, "r_y3": 545.6, "coord_origin": "TOPLEFT" }, "text": "C", "orig": "C", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 84, "label": "text", "bbox": { "l": 410.3, "t": 545.6, "r": 450.5, "b": 548.3, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 93, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 410.3, "r_y0": 548.3, "r_x1": 450.5, "r_y1": 548.3, "r_x2": 450.5, "r_y2": 545.6, "r_x3": 410.3, "r_y3": 545.6, "coord_origin": "TOPLEFT" }, "text": "C C C C C C C C C C C C C NL", "orig": "C C C C C C C C C C C C C NL", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 85, "label": "text", "bbox": { "l": 407.4, "t": 549.5, "r": 408.8, "b": 552.2, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 94, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 407.4, "r_y0": 552.2, "r_x1": 408.8, "r_y1": 552.2, "r_x2": 408.8, "r_y2": 549.5, "r_x3": 407.4, "r_y3": 549.5, "coord_origin": "TOPLEFT" }, "text": "C", "orig": "C", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 86, "label": "text", "bbox": { "l": 410.3, "t": 549.5, "r": 450.5, "b": 552.2, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 95, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 410.3, "r_y0": 552.2, "r_x1": 450.5, "r_y1": 552.2, "r_x2": 450.5, "r_y2": 549.5, "r_x3": 410.3, "r_y3": 549.5, "coord_origin": "TOPLEFT" }, "text": "C C C C C C C C C C C C C NL", "orig": "C C C C C C C C C C C C C NL", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 87, "label": "text", "bbox": { "l": 164.5, "t": 509.5, "r": 181.9, "b": 515.3, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 96, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 164.5, "r_y0": 515.3, "r_x1": 181.9, "r_y1": 515.3, "r_x2": 181.9, "r_y2": 509.5, "r_x3": 164.5, "r_y3": 509.5, "coord_origin": "TOPLEFT" }, "text": "HTML", "orig": "HTML", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 88, "label": "text", "bbox": { "l": 183.6, "t": 509.5, "r": 186.4, "b": 515.3, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 97, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 183.6, "r_y0": 515.3, "r_x1": 186.4, "r_y1": 515.3, "r_x2": 186.4, "r_y2": 509.5, "r_x3": 183.6, "r_y3": 509.5, "coord_origin": "TOPLEFT" }, "text": "#", "orig": "#", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 89, "label": "text", "bbox": { "l": 189.2, "t": 509.5, "r": 208.9, "b": 515.3, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 98, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 189.2, "r_y0": 515.3, "r_x1": 208.9, "r_y1": 515.3, "r_x2": 208.9, "r_y2": 509.5, "r_x3": 189.2, "r_y3": 509.5, "coord_origin": "TOPLEFT" }, "text": "tokens:", "orig": "tokens:", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 90, "label": "text", "bbox": { "l": 210.6, "t": 509.5, "r": 221.0, "b": 515.3, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 99, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 210.6, "r_y0": 515.3, "r_x1": 221.0, "r_y1": 515.3, "r_x2": 221.0, "r_y2": 509.5, "r_x3": 210.6, "r_y3": 509.5, "coord_origin": "TOPLEFT" }, "text": "258", "orig": "258", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 91, "label": "text", "bbox": { "l": 390.2, "t": 509.6, "r": 406.8, "b": 515.5, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 100, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 390.2, "r_y0": 515.5, "r_x1": 406.8, "r_y1": 515.5, "r_x2": 406.8, "r_y2": 509.6, "r_x3": 390.2, "r_y3": 509.6, "coord_origin": "TOPLEFT" }, "text": "OTSL", "orig": "OTSL", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 92, "label": "text", "bbox": { "l": 408.6, "t": 509.6, "r": 411.4, "b": 515.5, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 101, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 408.6, "r_y0": 515.5, "r_x1": 411.4, "r_y1": 515.5, "r_x2": 411.4, "r_y2": 509.6, "r_x3": 408.6, "r_y3": 509.6, "coord_origin": "TOPLEFT" }, "text": "#", "orig": "#", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 93, "label": "text", "bbox": { "l": 414.2, "t": 509.6, "r": 433.9, "b": 515.5, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 102, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 414.2, "r_y0": 515.5, "r_x1": 433.9, "r_y1": 515.5, "r_x2": 433.9, "r_y2": 509.6, "r_x3": 414.2, "r_y3": 509.6, "coord_origin": "TOPLEFT" }, "text": "tokens:", "orig": "tokens:", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 94, "label": "text", "bbox": { "l": 435.6, "t": 509.6, "r": 446.0, "b": 515.5, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 103, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 435.6, "r_y0": 515.5, "r_x1": 446.0, "r_y1": 515.5, "r_x2": 446.0, "r_y2": 509.6, "r_x3": 435.6, "r_y3": 509.6, "coord_origin": "TOPLEFT" }, "text": "135", "orig": "135", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 95, "label": "text", "bbox": { "l": 167.2, "t": 519.1, "r": 172.8, "b": 526.4, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 104, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 167.2, "r_y0": 526.4, "r_x1": 172.8, "r_y1": 526.4, "r_x2": 172.8, "r_y2": 519.1, "r_x3": 167.2, "r_y3": 519.1, "coord_origin": "TOPLEFT" }, "text": "B", "orig": "B", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 96, "label": "text", "bbox": { "l": 187.3, "t": 448.6, "r": 193.0, "b": 455.9, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 105, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 187.3, "r_y0": 455.9, "r_x1": 193.0, "r_y1": 455.9, "r_x2": 193.0, "r_y2": 448.6, "r_x3": 187.3, "r_y3": 448.6, "coord_origin": "TOPLEFT" }, "text": "A", "orig": "A", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 97, "label": "text", "bbox": { "l": 167.4, "t": 566.0, "r": 173.0, "b": 573.3, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 106, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 167.4, "r_y0": 573.3, "r_x1": 173.0, "r_y1": 573.3, "r_x2": 173.0, "r_y2": 566.0, "r_x3": 167.4, "r_y3": 566.0, "coord_origin": "TOPLEFT" }, "text": "D", "orig": "D", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 98, "label": "text", "bbox": { "l": 248.5, "t": 621.8, "r": 253.7, "b": 629.1, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 107, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 248.5, "r_y0": 629.1, "r_x1": 253.7, "r_y1": 629.1, "r_x2": 253.7, "r_y2": 621.8, "r_x3": 248.5, "r_y3": 621.8, "coord_origin": "TOPLEFT" }, "text": "E", "orig": "E", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 99, "label": "text", "bbox": { "l": 395.9, "t": 519.2, "r": 401.5, "b": 526.5, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 108, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 395.9, "r_y0": 526.5, "r_x1": 401.5, "r_y1": 526.5, "r_x2": 401.5, "r_y2": 519.2, "r_x3": 395.9, "r_y3": 519.2, "coord_origin": "TOPLEFT" }, "text": "C", "orig": "C", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 100, "label": "text", "bbox": { "l": 171.6, "t": 580.3, "r": 177.5, "b": 597.3, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 109, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 171.6, "r_y0": 597.3, "r_x1": 177.5, "r_y1": 597.3, "r_x2": 177.5, "r_y2": 580.3, "r_x3": 171.6, "r_y3": 580.3, "coord_origin": "TOPLEFT" }, "text": "HTML", "orig": "HTML", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 101, "label": "text", "bbox": { "l": 251.1, "t": 633.6, "r": 256.9, "b": 649.9, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 110, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 251.1, "r_y0": 649.9, "r_x1": 256.9, "r_y1": 649.9, "r_x2": 256.9, "r_y2": 633.6, "r_x3": 251.1, "r_y3": 633.6, "coord_origin": "TOPLEFT" }, "text": "OTSL", "orig": "OTSL", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 102, "label": "text", "bbox": { "l": 372.1, "t": 601.5, "r": 427.0, "b": 607.3, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 111, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 372.1, "r_y0": 607.3, "r_x1": 427.0, "r_y1": 607.3, "r_x2": 427.0, "r_y2": 601.5, "r_x3": 372.1, "r_y3": 601.5, "coord_origin": "TOPLEFT" }, "text": "HTML model shows", "orig": "HTML model shows", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 103, "label": "text", "bbox": { "l": 372.1, "t": 607.9, "r": 430.1, "b": 613.8, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 112, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 372.1, "r_y0": 613.8, "r_x1": 430.1, "r_y1": 613.8, "r_x2": 430.1, "r_y2": 607.9, "r_x3": 372.1, "r_y3": 607.9, "coord_origin": "TOPLEFT" }, "text": "bounding box drifting", "orig": "bounding box drifting", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 104, "label": "text", "bbox": { "l": 176.9, "t": 642.9, "r": 231.1, "b": 648.7, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 113, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 176.9, "r_y0": 648.7, "r_x1": 231.1, "r_y1": 648.7, "r_x2": 231.1, "r_y2": 642.9, "r_x3": 176.9, "r_y3": 642.9, "coord_origin": "TOPLEFT" }, "text": "OTSL model shows", "orig": "OTSL model shows", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 105, "label": "text", "bbox": { "l": 176.9, "t": 649.3, "r": 231.0, "b": 655.2, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 114, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 176.9, "r_y0": 655.2, "r_x1": 231.0, "r_y1": 655.2, "r_x2": 231.0, "r_y2": 649.3, "r_x3": 176.9, "r_y3": 649.3, "coord_origin": "TOPLEFT" }, "text": "clean bounding box", "orig": "clean bounding box", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 106, "label": "text", "bbox": { "l": 176.9, "t": 655.8, "r": 203.9, "b": 661.6, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 115, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 176.9, "r_y0": 661.6, "r_x1": 203.9, "r_y1": 661.6, "r_x2": 203.9, "r_y2": 655.8, "r_x3": 176.9, "r_y3": 655.8, "coord_origin": "TOPLEFT" }, "text": "alignment", "orig": "alignment", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 107, "label": "text", "bbox": { "l": 215.9, "t": 557.6, "r": 218.5, "b": 569.2, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 116, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 215.9, "r_y0": 569.2, "r_x1": 218.5, "r_y1": 569.2, "r_x2": 218.5, "r_y2": 557.6, "r_x3": 215.9, "r_y3": 557.6, "coord_origin": "TOPLEFT" }, "text": "\u2264", "orig": "\u2264", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 108, "label": "text", "bbox": { "l": 229.1, "t": 557.6, "r": 231.7, "b": 569.2, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 117, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 229.1, "r_y0": 569.2, "r_x1": 231.7, "r_y1": 569.2, "r_x2": 231.7, "r_y2": 557.6, "r_x3": 229.1, "r_y3": 557.6, "coord_origin": "TOPLEFT" }, "text": "\u03bc", "orig": "\u03bc", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 109, "label": "text", "bbox": { "l": 261.2, "t": 448.5, "r": 263.6, "b": 451.2, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 119, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 261.2, "r_y0": 451.2, "r_x1": 263.6, "r_y1": 451.2, "r_x2": 263.6, "r_y2": 448.5, "r_x3": 261.2, "r_y3": 448.5, "coord_origin": "TOPLEFT" }, "text": "S", "orig": "S", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 110, "label": "text", "bbox": { "l": 312.3, "t": 448.5, "r": 313.6, "b": 451.2, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 120, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 312.3, "r_y0": 451.2, "r_x1": 313.6, "r_y1": 451.2, "r_x2": 313.6, "r_y2": 448.5, "r_x3": 312.3, "r_y3": 448.5, "coord_origin": "TOPLEFT" }, "text": "I", "orig": "I", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 111, "label": "text", "bbox": { "l": 377.4, "t": 448.5, "r": 380.1, "b": 451.2, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 121, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 377.4, "r_y0": 451.2, "r_x1": 380.1, "r_y1": 451.2, "r_x2": 380.1, "r_y2": 448.5, "r_x3": 377.4, "r_y3": 448.5, "coord_origin": "TOPLEFT" }, "text": "R", "orig": "R", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 112, "label": "text", "bbox": { "l": 200.6, "t": 453.3, "r": 205.8, "b": 456.1, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 122, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 200.6, "r_y0": 456.1, "r_x1": 205.8, "r_y1": 456.1, "r_x2": 205.8, "r_y2": 453.3, "r_x3": 200.6, "r_y3": 453.3, "coord_origin": "TOPLEFT" }, "text": "ST", "orig": "ST", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 113, "label": "text", "bbox": { "l": 222.2, "t": 453.3, "r": 229.8, "b": 456.1, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 123, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 222.2, "r_y0": 456.1, "r_x1": 229.8, "r_y1": 456.1, "r_x2": 229.8, "r_y2": 453.3, "r_x3": 222.2, "r_y3": 453.3, "coord_origin": "TOPLEFT" }, "text": "0.03", "orig": "0.03", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 114, "label": "text", "bbox": { "l": 243.3, "t": 453.3, "r": 250.8, "b": 456.1, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 124, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 243.3, "r_y0": 456.1, "r_x1": 250.8, "r_y1": 456.1, "r_x2": 250.8, "r_y2": 453.3, "r_x3": 243.3, "r_y3": 453.3, "coord_origin": "TOPLEFT" }, "text": "0.06", "orig": "0.06", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 115, "label": "text", "bbox": { "l": 264.3, "t": 453.3, "r": 271.8, "b": 456.1, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 125, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 264.3, "r_y0": 456.1, "r_x1": 271.8, "r_y1": 456.1, "r_x2": 271.8, "r_y2": 453.3, "r_x3": 264.3, "r_y3": 453.3, "coord_origin": "TOPLEFT" }, "text": "0.12", "orig": "0.12", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 116, "label": "text", "bbox": { "l": 285.3, "t": 453.3, "r": 292.9, "b": 456.1, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 126, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 285.3, "r_y0": 456.1, "r_x1": 292.9, "r_y1": 456.1, "r_x2": 292.9, "r_y2": 453.3, "r_x3": 285.3, "r_y3": 453.3, "coord_origin": "TOPLEFT" }, "text": "0.25", "orig": "0.25", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 117, "label": "text", "bbox": { "l": 306.4, "t": 453.3, "r": 311.8, "b": 456.1, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 127, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 306.4, "r_y0": 456.1, "r_x1": 311.8, "r_y1": 456.1, "r_x2": 311.8, "r_y2": 453.3, "r_x3": 306.4, "r_y3": 453.3, "coord_origin": "TOPLEFT" }, "text": "0.5", "orig": "0.5", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 118, "label": "text", "bbox": { "l": 323.4, "t": 453.3, "r": 325.6, "b": 456.1, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 128, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 323.4, "r_y0": 456.1, "r_x1": 325.6, "r_y1": 456.1, "r_x2": 325.6, "r_y2": 453.3, "r_x3": 323.4, "r_y3": 453.3, "coord_origin": "TOPLEFT" }, "text": "1", "orig": "1", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 119, "label": "text", "bbox": { "l": 334.5, "t": 453.3, "r": 336.6, "b": 456.1, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 129, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 334.5, "r_y0": 456.1, "r_x1": 336.6, "r_y1": 456.1, "r_x2": 336.6, "r_y2": 453.3, "r_x3": 334.5, "r_y3": 453.3, "coord_origin": "TOPLEFT" }, "text": "2", "orig": "2", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 120, "label": "text", "bbox": { "l": 345.5, "t": 453.3, "r": 347.7, "b": 456.1, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 130, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 345.5, "r_y0": 456.1, "r_x1": 347.7, "r_y1": 456.1, "r_x2": 347.7, "r_y2": 453.3, "r_x3": 345.5, "r_y3": 453.3, "coord_origin": "TOPLEFT" }, "text": "4", "orig": "4", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 121, "label": "text", "bbox": { "l": 356.6, "t": 453.3, "r": 358.7, "b": 456.1, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 131, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 356.6, "r_y0": 456.1, "r_x1": 358.7, "r_y1": 456.1, "r_x2": 358.7, "r_y2": 453.3, "r_x3": 356.6, "r_y3": 453.3, "coord_origin": "TOPLEFT" }, "text": "8", "orig": "8", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 122, "label": "text", "bbox": { "l": 367.6, "t": 453.3, "r": 372.0, "b": 456.1, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 132, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 367.6, "r_y0": 456.1, "r_x1": 372.0, "r_y1": 456.1, "r_x2": 372.0, "r_y2": 453.3, "r_x3": 367.6, "r_y3": 453.3, "coord_origin": "TOPLEFT" }, "text": "16", "orig": "16", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 123, "label": "text", "bbox": { "l": 382.7, "t": 453.3, "r": 387.0, "b": 456.1, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 133, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 382.7, "r_y0": 456.1, "r_x1": 387.0, "r_y1": 456.1, "r_x2": 387.0, "r_y2": 453.3, "r_x3": 382.7, "r_y3": 453.3, "coord_origin": "TOPLEFT" }, "text": "32", "orig": "32", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 124, "label": "text", "bbox": { "l": 397.7, "t": 453.3, "r": 402.1, "b": 456.1, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 134, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 397.7, "r_y0": 456.1, "r_x1": 402.1, "r_y1": 456.1, "r_x2": 402.1, "r_y2": 453.3, "r_x3": 397.7, "r_y3": 453.3, "coord_origin": "TOPLEFT" }, "text": "64", "orig": "64", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 125, "label": "text", "bbox": { "l": 412.8, "t": 448.0, "r": 414.9, "b": 457.8, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 135, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 412.8, "r_y0": 457.8, "r_x1": 414.9, "r_y1": 457.8, "r_x2": 414.9, "r_y2": 448.0, "r_x3": 412.8, "r_y3": 448.0, "coord_origin": "TOPLEFT" }, "text": "\u2265", "orig": "\u2265", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 126, "label": "text", "bbox": { "l": 415.0, "t": 453.3, "r": 422.5, "b": 456.1, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 136, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 415.0, "r_y0": 456.1, "r_x1": 422.5, "r_y1": 456.1, "r_x2": 422.5, "r_y2": 453.3, "r_x3": 415.0, "r_y3": 453.3, "coord_origin": "TOPLEFT" }, "text": " 128", "orig": " 128", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 127, "label": "text", "bbox": { "l": 200.6, "t": 463.9, "r": 204.6, "b": 466.7, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 137, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 200.6, "r_y0": 466.7, "r_x1": 204.6, "r_y1": 466.7, "r_x2": 204.6, "r_y2": 463.9, "r_x3": 200.6, "r_y3": 463.9, "coord_origin": "TOPLEFT" }, "text": "63", "orig": "63", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 128, "label": "text", "bbox": { "l": 367.6, "t": 463.9, "r": 369.6, "b": 466.7, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 138, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 367.6, "r_y0": 466.7, "r_x1": 369.6, "r_y1": 466.7, "r_x2": 369.6, "r_y2": 463.9, "r_x3": 367.6, "r_y3": 463.9, "coord_origin": "TOPLEFT" }, "text": "1", "orig": "1", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 129, "label": "text", "bbox": { "l": 382.7, "t": 463.9, "r": 384.6, "b": 466.7, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 139, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 382.7, "r_y0": 466.7, "r_x1": 384.6, "r_y1": 466.7, "r_x2": 384.6, "r_y2": 463.9, "r_x3": 382.7, "r_y3": 463.9, "coord_origin": "TOPLEFT" }, "text": "1", "orig": "1", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 130, "label": "text", "bbox": { "l": 397.7, "t": 463.9, "r": 399.7, "b": 466.7, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 140, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 397.7, "r_y0": 466.7, "r_x1": 399.7, "r_y1": 466.7, "r_x2": 399.7, "r_y2": 463.9, "r_x3": 397.7, "r_y3": 463.9, "coord_origin": "TOPLEFT" }, "text": "3", "orig": "3", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 131, "label": "text", "bbox": { "l": 200.6, "t": 468.8, "r": 206.5, "b": 471.5, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 141, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 200.6, "r_y0": 471.5, "r_x1": 206.5, "r_y1": 471.5, "r_x2": 206.5, "r_y2": 468.8, "r_x3": 200.6, "r_y3": 468.8, "coord_origin": "TOPLEFT" }, "text": "199", "orig": "199", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 132, "label": "text", "bbox": { "l": 264.3, "t": 468.8, "r": 266.3, "b": 471.5, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 142, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 264.3, "r_y0": 471.5, "r_x1": 266.3, "r_y1": 471.5, "r_x2": 266.3, "r_y2": 468.8, "r_x3": 264.3, "r_y3": 468.8, "coord_origin": "TOPLEFT" }, "text": "5", "orig": "5", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 133, "label": "text", "bbox": { "l": 306.4, "t": 468.8, "r": 308.3, "b": 471.5, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 143, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 306.4, "r_y0": 471.5, "r_x1": 308.3, "r_y1": 471.5, "r_x2": 308.3, "r_y2": 468.8, "r_x3": 306.4, "r_y3": 468.8, "coord_origin": "TOPLEFT" }, "text": "1", "orig": "1", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 134, "label": "text", "bbox": { "l": 345.5, "t": 468.8, "r": 347.5, "b": 471.5, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 144, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 345.5, "r_y0": 471.5, "r_x1": 347.5, "r_y1": 471.5, "r_x2": 347.5, "r_y2": 468.8, "r_x3": 345.5, "r_y3": 468.8, "coord_origin": "TOPLEFT" }, "text": "2", "orig": "2", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 135, "label": "text", "bbox": { "l": 356.6, "t": 468.8, "r": 358.5, "b": 471.5, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 145, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 356.6, "r_y0": 471.5, "r_x1": 358.5, "r_y1": 471.5, "r_x2": 358.5, "r_y2": 468.8, "r_x3": 356.6, "r_y3": 468.8, "coord_origin": "TOPLEFT" }, "text": "4", "orig": "4", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 136, "label": "text", "bbox": { "l": 367.6, "t": 468.8, "r": 369.6, "b": 471.5, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 146, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 367.6, "r_y0": 471.5, "r_x1": 369.6, "r_y1": 471.5, "r_x2": 369.6, "r_y2": 468.8, "r_x3": 367.6, "r_y3": 468.8, "coord_origin": "TOPLEFT" }, "text": "1", "orig": "1", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 137, "label": "text", "bbox": { "l": 382.7, "t": 468.8, "r": 384.6, "b": 471.5, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 147, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 382.7, "r_y0": 471.5, "r_x1": 384.6, "r_y1": 471.5, "r_x2": 384.6, "r_y2": 468.8, "r_x3": 382.7, "r_y3": 468.8, "coord_origin": "TOPLEFT" }, "text": "1", "orig": "1", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 138, "label": "text", "bbox": { "l": 200.6, "t": 473.7, "r": 206.5, "b": 476.4, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 148, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 200.6, "r_y0": 476.4, "r_x1": 206.5, "r_y1": 476.4, "r_x2": 206.5, "r_y2": 473.7, "r_x3": 200.6, "r_y3": 473.7, "coord_origin": "TOPLEFT" }, "text": "416", "orig": "416", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 139, "label": "text", "bbox": { "l": 264.3, "t": 473.7, "r": 266.3, "b": 476.4, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 149, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 264.3, "r_y0": 476.4, "r_x1": 266.3, "r_y1": 476.4, "r_x2": 266.3, "r_y2": 473.7, "r_x3": 264.3, "r_y3": 473.7, "coord_origin": "TOPLEFT" }, "text": "4", "orig": "4", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 140, "label": "text", "bbox": { "l": 200.6, "t": 478.5, "r": 206.5, "b": 481.3, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 150, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 200.6, "r_y0": 481.3, "r_x1": 206.5, "r_y1": 481.3, "r_x2": 206.5, "r_y2": 478.5, "r_x3": 200.6, "r_y3": 478.5, "coord_origin": "TOPLEFT" }, "text": "230", "orig": "230", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 141, "label": "text", "bbox": { "l": 243.3, "t": 478.5, "r": 245.2, "b": 481.3, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 151, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 243.3, "r_y0": 481.3, "r_x1": 245.2, "r_y1": 481.3, "r_x2": 245.2, "r_y2": 478.5, "r_x3": 243.3, "r_y3": 478.5, "coord_origin": "TOPLEFT" }, "text": "1", "orig": "1", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 142, "label": "text", "bbox": { "l": 264.3, "t": 478.5, "r": 266.3, "b": 481.3, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 152, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 264.3, "r_y0": 481.3, "r_x1": 266.3, "r_y1": 481.3, "r_x2": 266.3, "r_y2": 478.5, "r_x3": 264.3, "r_y3": 478.5, "coord_origin": "TOPLEFT" }, "text": "9", "orig": "9", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 143, "label": "text", "bbox": { "l": 323.4, "t": 478.5, "r": 325.4, "b": 481.3, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 153, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 323.4, "r_y0": 481.3, "r_x1": 325.4, "r_y1": 481.3, "r_x2": 325.4, "r_y2": 478.5, "r_x3": 323.4, "r_y3": 478.5, "coord_origin": "TOPLEFT" }, "text": "1", "orig": "1", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 144, "label": "text", "bbox": { "l": 397.7, "t": 478.5, "r": 399.7, "b": 481.3, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 154, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 397.7, "r_y0": 481.3, "r_x1": 399.7, "r_y1": 481.3, "r_x2": 399.7, "r_y2": 478.5, "r_x3": 397.7, "r_y3": 478.5, "coord_origin": "TOPLEFT" }, "text": "1", "orig": "1", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 145, "label": "text", "bbox": { "l": 200.6, "t": 483.4, "r": 206.5, "b": 486.1, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 155, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 200.6, "r_y0": 486.1, "r_x1": 206.5, "r_y1": 486.1, "r_x2": 206.5, "r_y2": 483.4, "r_x3": 200.6, "r_y3": 483.4, "coord_origin": "TOPLEFT" }, "text": "276", "orig": "276", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 146, "label": "text", "bbox": { "l": 382.7, "t": 483.4, "r": 384.6, "b": 486.1, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 156, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 382.7, "r_y0": 486.1, "r_x1": 384.6, "r_y1": 486.1, "r_x2": 384.6, "r_y2": 483.4, "r_x3": 382.7, "r_y3": 483.4, "coord_origin": "TOPLEFT" }, "text": "2", "orig": "2", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 147, "label": "text", "bbox": { "l": 397.7, "t": 483.4, "r": 401.6, "b": 486.1, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 157, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 397.7, "r_y0": 486.1, "r_x1": 401.6, "r_y1": 486.1, "r_x2": 401.6, "r_y2": 483.4, "r_x3": 397.7, "r_y3": 483.4, "coord_origin": "TOPLEFT" }, "text": "12", "orig": "12", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 148, "label": "text", "bbox": { "l": 412.8, "t": 483.4, "r": 414.7, "b": 486.1, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 158, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 412.8, "r_y0": 486.1, "r_x1": 414.7, "r_y1": 486.1, "r_x2": 414.7, "r_y2": 483.4, "r_x3": 412.8, "r_y3": 483.4, "coord_origin": "TOPLEFT" }, "text": "1", "orig": "1", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 149, "label": "text", "bbox": { "l": 200.6, "t": 488.3, "r": 207.1, "b": 491.0, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 159, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 200.6, "r_y0": 491.0, "r_x1": 207.1, "r_y1": 491.0, "r_x2": 207.1, "r_y2": 488.3, "r_x3": 200.6, "r_y3": 488.3, "coord_origin": "TOPLEFT" }, "text": "320", "orig": "320", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 150, "label": "text", "bbox": { "l": 367.6, "t": 488.3, "r": 369.8, "b": 491.0, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 160, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 367.6, "r_y0": 491.0, "r_x1": 369.8, "r_y1": 491.0, "r_x2": 369.8, "r_y2": 488.3, "r_x3": 367.6, "r_y3": 488.3, "coord_origin": "TOPLEFT" }, "text": "1", "orig": "1", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 151, "label": "text", "bbox": { "l": 382.7, "t": 488.3, "r": 384.8, "b": 491.0, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 161, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 382.7, "r_y0": 491.0, "r_x1": 384.8, "r_y1": 491.0, "r_x2": 384.8, "r_y2": 488.3, "r_x3": 382.7, "r_y3": 488.3, "coord_origin": "TOPLEFT" }, "text": "4", "orig": "4", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 152, "label": "text", "bbox": { "l": 397.7, "t": 488.3, "r": 402.1, "b": 491.0, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 162, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 397.7, "r_y0": 491.0, "r_x1": 402.1, "r_y1": 491.0, "r_x2": 402.1, "r_y2": 488.3, "r_x3": 397.7, "r_y3": 488.3, "coord_origin": "TOPLEFT" }, "text": "20", "orig": "20", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 153, "label": "text", "bbox": { "l": 200.6, "t": 493.2, "r": 208.5, "b": 495.9, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 163, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 200.6, "r_y0": 495.9, "r_x1": 208.5, "r_y1": 495.9, "r_x2": 208.5, "r_y2": 493.2, "r_x3": 200.6, "r_y3": 493.2, "coord_origin": "TOPLEFT" }, "text": "2013", "orig": "2013", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 154, "label": "text", "bbox": { "l": 264.3, "t": 493.2, "r": 266.3, "b": 495.9, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 164, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 264.3, "r_y0": 495.9, "r_x1": 266.3, "r_y1": 495.9, "r_x2": 266.3, "r_y2": 493.2, "r_x3": 264.3, "r_y3": 493.2, "coord_origin": "TOPLEFT" }, "text": "3", "orig": "3", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] } ] }, "text": "", "annotations": [], "provenance": null, "predicted_class": null, "confidence": null }, { "label": "text", "id": 155, "page_no": 9, "cluster": { "id": 155, "label": "text", "bbox": { "l": 227.9, "t": 665.8, "r": 230.1, "b": 675.3, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 165, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 227.9, "r_y0": 675.3, "r_x1": 230.1, "r_y1": 675.3, "r_x2": 230.1, "r_y2": 665.8, "r_x3": 227.9, "r_y3": 665.8, "coord_origin": "TOPLEFT" }, "text": "\u03bc", "orig": "\u03bc", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, "text": "\u03bc" }, { "label": "text", "id": 156, "page_no": 9, "cluster": { "id": 156, "label": "text", "bbox": { "l": 300.6, "t": 683.6, "r": 302.7, "b": 693.4, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 166, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 300.6, "r_y0": 693.4, "r_x1": 302.7, "r_y1": 693.4, "r_x2": 302.7, "r_y2": 683.6, "r_x3": 300.6, "r_y3": 683.6, "coord_origin": "TOPLEFT" }, "text": "\u2265", "orig": "\u2265", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, "text": "\u2265" } ], "headers": [ { "label": "page_header", "id": 7, "page_no": 9, "cluster": { "id": 7, "label": "page_header", "bbox": { "l": 134.8, "t": 93.8, "r": 144.0, "b": 101.8, "coord_origin": "TOPLEFT" }, "confidence": 0.83, "cells": [ { "index": 0, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 134.8, "r_y0": 101.8, "r_x1": 144.0, "r_y1": 101.8, "r_x2": 144.0, "r_y2": 93.8, "r_x3": 134.8, "r_y3": 93.8, "coord_origin": "TOPLEFT" }, "text": "10", "orig": "10", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, "text": "10" }, { "label": "page_header", "id": 6, "page_no": 9, "cluster": { "id": 6, "label": "page_header", "bbox": { "l": 167.8, "t": 93.8, "r": 231.7, "b": 101.8, "coord_origin": "TOPLEFT" }, "confidence": 0.84, "cells": [ { "index": 1, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 167.8, "r_y0": 101.8, "r_x1": 178.1, "r_y1": 101.8, "r_x2": 178.1, "r_y2": 93.8, "r_x3": 167.8, "r_y3": 93.8, "coord_origin": "TOPLEFT" }, "text": "M.", "orig": "M.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 2, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 182.4, "r_y0": 101.8, "r_x1": 231.7, "r_y1": 101.8, "r_x2": 231.7, "r_y2": 93.8, "r_x3": 182.4, "r_y3": 93.8, "coord_origin": "TOPLEFT" }, "text": "Lysak, et al.", "orig": "Lysak, et al.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, "text": "M. Lysak, et al." } ] } }, { "page_no": 10, "size": { "width": 612.0, "height": 792.0 }, "parsed_page": { "dimension": { "angle": 0.0, "rect": { "r_x0": 0.0, "r_y0": 0.0, "r_x1": 612.0, "r_y1": 0.0, "r_x2": 612.0, "r_y2": 792.0, "r_x3": 0.0, "r_y3": 792.0, "coord_origin": "BOTTOMLEFT" }, "boundary_type": "crop_box", "art_bbox": { "l": 0.0, "t": 792.0, "r": 612.0, "b": 0.0, "coord_origin": "BOTTOMLEFT" }, "bleed_bbox": { "l": 0.0, "t": 792.0, "r": 612.0, "b": 0.0, "coord_origin": "BOTTOMLEFT" }, "crop_bbox": { "l": 0.0, "t": 792.0, "r": 612.0, "b": 0.0, "coord_origin": "BOTTOMLEFT" }, "media_bbox": { "l": 0.0, "t": 792.0, "r": 612.0, "b": 0.0, "coord_origin": "BOTTOMLEFT" }, "trim_bbox": { "l": 0.0, "t": 792.0, "r": 612.0, "b": 0.0, "coord_origin": "BOTTOMLEFT" } }, "bitmap_resources": [], "char_cells": [], "word_cells": [], "textline_cells": [ { "index": 0, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 194.5, "r_y0": 101.8, "r_x1": 447.5, "r_y1": 101.8, "r_x2": 447.5, "r_y2": 93.8, "r_x3": 194.5, "r_y3": 93.8, "coord_origin": "TOPLEFT" }, "text": "Optimized Table Tokenization for Table Structure Recognition", "orig": "Optimized Table Tokenization for Table Structure Recognition", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 1, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 471.4, "r_y0": 101.8, "r_x1": 480.6, "r_y1": 101.8, "r_x2": 480.6, "r_y2": 93.8, "r_x3": 471.4, "r_y3": 93.8, "coord_origin": "TOPLEFT" }, "text": "11", "orig": "11", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 2, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 134.8, "r_y0": 133.7, "r_x1": 162.6, "r_y1": 133.7, "r_x2": 162.6, "r_y2": 125.8, "r_x3": 134.8, "r_y3": 125.8, "coord_origin": "TOPLEFT" }, "text": "Fig. 6.", "orig": "Fig. 6.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 3, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 165.2, "r_y0": 133.9, "r_x1": 480.6, "r_y1": 133.9, "r_x2": 480.6, "r_y2": 125.9, "r_x3": 165.2, "r_y3": 125.9, "coord_origin": "TOPLEFT" }, "text": "Visualization of predicted structure and detected bounding boxes on a complex", "orig": "Visualization of predicted structure and detected bounding boxes on a complex", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 4, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 134.8, "r_y0": 144.9, "r_x1": 480.6, "r_y1": 144.9, "r_x2": 480.6, "r_y2": 136.8, "r_x3": 134.8, "r_y3": 136.8, "coord_origin": "TOPLEFT" }, "text": "table with many rows. The OTSL model (B) captured repeating pattern of horizontally", "orig": "table with many rows. The OTSL model (B) captured repeating pattern of horizontally", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 5, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 134.8, "r_y0": 155.8, "r_x1": 480.6, "r_y1": 155.8, "r_x2": 480.6, "r_y2": 147.8, "r_x3": 134.8, "r_y3": 147.8, "coord_origin": "TOPLEFT" }, "text": "merged cells from the GT (A), unlike the HTML model (C). The HTML model also", "orig": "merged cells from the GT (A), unlike the HTML model (C). The HTML model also", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 6, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 134.8, "r_y0": 166.8, "r_x1": 480.6, "r_y1": 166.8, "r_x2": 480.6, "r_y2": 158.7, "r_x3": 134.8, "r_y3": 158.7, "coord_origin": "TOPLEFT" }, "text": "didn\u2019t complete the HTML sequence correctly and displayed a lot more of drift and", "orig": "didn\u2019t complete the HTML sequence correctly and displayed a lot more of drift and", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 7, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 134.8, "r_y0": 177.8, "r_x1": 415.8, "r_y1": 177.8, "r_x2": 415.8, "r_y2": 169.7, "r_x3": 134.8, "r_y3": 169.7, "coord_origin": "TOPLEFT" }, "text": "overlap of bounding boxes. \"PMC5406406_003_01.png\" PubTabNet.", "orig": "overlap of bounding boxes. \"PMC5406406_003_01.png\" PubTabNet.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 8, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 171.5, "r_y0": 320.4, "r_x1": 177.6, "r_y1": 320.4, "r_x2": 177.6, "r_y2": 312.5, "r_x3": 171.5, "r_y3": 312.5, "coord_origin": "TOPLEFT" }, "text": "B", "orig": "B", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 9, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 171.1, "r_y0": 500.6, "r_x1": 177.1, "r_y1": 500.6, "r_x2": 177.1, "r_y2": 492.7, "r_x3": 171.1, "r_y3": 492.7, "coord_origin": "TOPLEFT" }, "text": "C", "orig": "C", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 10, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 283.0, "r_y0": 633.4, "r_x1": 375.0, "r_y1": 633.4, "r_x2": 375.0, "r_y2": 627.5, "r_x3": 283.0, "r_y3": 627.5, "coord_origin": "TOPLEFT" }, "text": "Incorrect end of HTML sequence", "orig": "Incorrect end of HTML sequence", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 11, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 283.0, "r_y0": 623.3, "r_x1": 398.1, "r_y1": 623.3, "r_x2": 398.1, "r_y2": 617.4, "r_x3": 283.0, "r_y3": 617.4, "coord_origin": "TOPLEFT" }, "text": "Horizontally merged cells are not present", "orig": "Horizontally merged cells are not present", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 12, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 293.6, "r_y0": 471.5, "r_x1": 437.5, "r_y1": 471.5, "r_x2": 437.5, "r_y2": 465.6, "r_x3": 293.6, "r_y3": 465.6, "coord_origin": "TOPLEFT" }, "text": "Repeating pattern is well represented in predictions", "orig": "Repeating pattern is well represented in predictions", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 13, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 181.9, "r_y0": 294.3, "r_x1": 239.2, "r_y1": 294.3, "r_x2": 239.2, "r_y2": 288.4, "r_x3": 181.9, "r_y3": 288.4, "coord_origin": "TOPLEFT" }, "text": "Repeating pattern of", "orig": "Repeating pattern of", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 14, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 181.9, "r_y0": 300.8, "r_x1": 251.5, "r_y1": 300.8, "r_x2": 251.5, "r_y2": 294.9, "r_x3": 181.9, "r_y3": 294.9, "coord_origin": "TOPLEFT" }, "text": "horizontally merged cells", "orig": "horizontally merged cells", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 15, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 247.8, "r_y0": 194.8, "r_x1": 253.6, "r_y1": 194.8, "r_x2": 253.6, "r_y2": 184.8, "r_x3": 247.8, "r_y3": 184.8, "coord_origin": "TOPLEFT" }, "text": "A", "orig": "A", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 16, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 292.2, "r_y0": 613.7, "r_x1": 381.5, "r_y1": 613.7, "r_x2": 381.5, "r_y2": 607.8, "r_x3": 292.2, "r_y3": 607.8, "coord_origin": "TOPLEFT" }, "text": "Bounding box drifting at the end", "orig": "Bounding box drifting at the end", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 17, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 172.3, "r_y0": 403.4, "r_x1": 180.2, "r_y1": 403.4, "r_x2": 180.2, "r_y2": 381.4, "r_x3": 172.3, "r_y3": 381.4, "coord_origin": "TOPLEFT" }, "text": "OTSL", "orig": "OTSL", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 18, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 172.3, "r_y0": 578.7, "r_x1": 180.2, "r_y1": 578.7, "r_x2": 180.2, "r_y2": 555.8, "r_x3": 172.3, "r_y3": 555.8, "coord_origin": "TOPLEFT" }, "text": "HTML", "orig": "HTML", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "has_chars": false, "has_words": false, "has_lines": true, "image": null, "lines": [] }, "predictions": { "layout": { "clusters": [ { "id": 0, "label": "page_header", "bbox": { "l": 194.5, "t": 93.8, "r": 447.5, "b": 101.8, "coord_origin": "TOPLEFT" }, "confidence": 0.93, "cells": [ { "index": 0, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 194.5, "r_y0": 101.8, "r_x1": 447.5, "r_y1": 101.8, "r_x2": 447.5, "r_y2": 93.8, "r_x3": 194.5, "r_y3": 93.8, "coord_origin": "TOPLEFT" }, "text": "Optimized Table Tokenization for Table Structure Recognition", "orig": "Optimized Table Tokenization for Table Structure Recognition", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 1, "label": "page_header", "bbox": { "l": 471.4, "t": 93.8, "r": 480.6, "b": 101.8, "coord_origin": "TOPLEFT" }, "confidence": 0.9, "cells": [ { "index": 1, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 471.4, "r_y0": 101.8, "r_x1": 480.6, "r_y1": 101.8, "r_x2": 480.6, "r_y2": 93.8, "r_x3": 471.4, "r_y3": 93.8, "coord_origin": "TOPLEFT" }, "text": "11", "orig": "11", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 2, "label": "caption", "bbox": { "l": 134.8, "t": 125.8, "r": 480.6, "b": 177.8, "coord_origin": "TOPLEFT" }, "confidence": 0.87, "cells": [ { "index": 2, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 134.8, "r_y0": 133.7, "r_x1": 162.6, "r_y1": 133.7, "r_x2": 162.6, "r_y2": 125.8, "r_x3": 134.8, "r_y3": 125.8, "coord_origin": "TOPLEFT" }, "text": "Fig. 6.", "orig": "Fig. 6.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 3, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 165.2, "r_y0": 133.9, "r_x1": 480.6, "r_y1": 133.9, "r_x2": 480.6, "r_y2": 125.9, "r_x3": 165.2, "r_y3": 125.9, "coord_origin": "TOPLEFT" }, "text": "Visualization of predicted structure and detected bounding boxes on a complex", "orig": "Visualization of predicted structure and detected bounding boxes on a complex", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 4, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 134.8, "r_y0": 144.9, "r_x1": 480.6, "r_y1": 144.9, "r_x2": 480.6, "r_y2": 136.8, "r_x3": 134.8, "r_y3": 136.8, "coord_origin": "TOPLEFT" }, "text": "table with many rows. The OTSL model (B) captured repeating pattern of horizontally", "orig": "table with many rows. The OTSL model (B) captured repeating pattern of horizontally", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 5, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 134.8, "r_y0": 155.8, "r_x1": 480.6, "r_y1": 155.8, "r_x2": 480.6, "r_y2": 147.8, "r_x3": 134.8, "r_y3": 147.8, "coord_origin": "TOPLEFT" }, "text": "merged cells from the GT (A), unlike the HTML model (C). The HTML model also", "orig": "merged cells from the GT (A), unlike the HTML model (C). The HTML model also", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 6, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 134.8, "r_y0": 166.8, "r_x1": 480.6, "r_y1": 166.8, "r_x2": 480.6, "r_y2": 158.7, "r_x3": 134.8, "r_y3": 158.7, "coord_origin": "TOPLEFT" }, "text": "didn\u2019t complete the HTML sequence correctly and displayed a lot more of drift and", "orig": "didn\u2019t complete the HTML sequence correctly and displayed a lot more of drift and", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 7, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 134.8, "r_y0": 177.8, "r_x1": 415.8, "r_y1": 177.8, "r_x2": 415.8, "r_y2": 169.7, "r_x3": 134.8, "r_y3": 169.7, "coord_origin": "TOPLEFT" }, "text": "overlap of bounding boxes. \"PMC5406406_003_01.png\" PubTabNet.", "orig": "overlap of bounding boxes. \"PMC5406406_003_01.png\" PubTabNet.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 3, "label": "picture", "bbox": { "l": 168.4, "t": 182.0, "r": 447.4, "b": 634.0, "coord_origin": "TOPLEFT" }, "confidence": 0.76, "cells": [ { "index": 8, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 171.5, "r_y0": 320.4, "r_x1": 177.6, "r_y1": 320.4, "r_x2": 177.6, "r_y2": 312.5, "r_x3": 171.5, "r_y3": 312.5, "coord_origin": "TOPLEFT" }, "text": "B", "orig": "B", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 9, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 171.1, "r_y0": 500.6, "r_x1": 177.1, "r_y1": 500.6, "r_x2": 177.1, "r_y2": 492.7, "r_x3": 171.1, "r_y3": 492.7, "coord_origin": "TOPLEFT" }, "text": "C", "orig": "C", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 10, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 283.0, "r_y0": 633.4, "r_x1": 375.0, "r_y1": 633.4, "r_x2": 375.0, "r_y2": 627.5, "r_x3": 283.0, "r_y3": 627.5, "coord_origin": "TOPLEFT" }, "text": "Incorrect end of HTML sequence", "orig": "Incorrect end of HTML sequence", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 11, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 283.0, "r_y0": 623.3, "r_x1": 398.1, "r_y1": 623.3, "r_x2": 398.1, "r_y2": 617.4, "r_x3": 283.0, "r_y3": 617.4, "coord_origin": "TOPLEFT" }, "text": "Horizontally merged cells are not present", "orig": "Horizontally merged cells are not present", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 12, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 293.6, "r_y0": 471.5, "r_x1": 437.5, "r_y1": 471.5, "r_x2": 437.5, "r_y2": 465.6, "r_x3": 293.6, "r_y3": 465.6, "coord_origin": "TOPLEFT" }, "text": "Repeating pattern is well represented in predictions", "orig": "Repeating pattern is well represented in predictions", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 13, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 181.9, "r_y0": 294.3, "r_x1": 239.2, "r_y1": 294.3, "r_x2": 239.2, "r_y2": 288.4, "r_x3": 181.9, "r_y3": 288.4, "coord_origin": "TOPLEFT" }, "text": "Repeating pattern of", "orig": "Repeating pattern of", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 14, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 181.9, "r_y0": 300.8, "r_x1": 251.5, "r_y1": 300.8, "r_x2": 251.5, "r_y2": 294.9, "r_x3": 181.9, "r_y3": 294.9, "coord_origin": "TOPLEFT" }, "text": "horizontally merged cells", "orig": "horizontally merged cells", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 15, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 247.8, "r_y0": 194.8, "r_x1": 253.6, "r_y1": 194.8, "r_x2": 253.6, "r_y2": 184.8, "r_x3": 247.8, "r_y3": 184.8, "coord_origin": "TOPLEFT" }, "text": "A", "orig": "A", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 16, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 292.2, "r_y0": 613.7, "r_x1": 381.5, "r_y1": 613.7, "r_x2": 381.5, "r_y2": 607.8, "r_x3": 292.2, "r_y3": 607.8, "coord_origin": "TOPLEFT" }, "text": "Bounding box drifting at the end", "orig": "Bounding box drifting at the end", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 17, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 172.3, "r_y0": 403.4, "r_x1": 180.2, "r_y1": 403.4, "r_x2": 180.2, "r_y2": 381.4, "r_x3": 172.3, "r_y3": 381.4, "coord_origin": "TOPLEFT" }, "text": "OTSL", "orig": "OTSL", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 18, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 172.3, "r_y0": 578.7, "r_x1": 180.2, "r_y1": 578.7, "r_x2": 180.2, "r_y2": 555.8, "r_x3": 172.3, "r_y3": 555.8, "coord_origin": "TOPLEFT" }, "text": "HTML", "orig": "HTML", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [ { "id": 18, "label": "text", "bbox": { "l": 171.5, "t": 312.5, "r": 177.6, "b": 320.4, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 8, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 171.5, "r_y0": 320.4, "r_x1": 177.6, "r_y1": 320.4, "r_x2": 177.6, "r_y2": 312.5, "r_x3": 171.5, "r_y3": 312.5, "coord_origin": "TOPLEFT" }, "text": "B", "orig": "B", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 19, "label": "text", "bbox": { "l": 171.1, "t": 492.7, "r": 177.1, "b": 500.6, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 9, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 171.1, "r_y0": 500.6, "r_x1": 177.1, "r_y1": 500.6, "r_x2": 177.1, "r_y2": 492.7, "r_x3": 171.1, "r_y3": 492.7, "coord_origin": "TOPLEFT" }, "text": "C", "orig": "C", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 20, "label": "text", "bbox": { "l": 283.0, "t": 627.5, "r": 375.0, "b": 633.4, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 10, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 283.0, "r_y0": 633.4, "r_x1": 375.0, "r_y1": 633.4, "r_x2": 375.0, "r_y2": 627.5, "r_x3": 283.0, "r_y3": 627.5, "coord_origin": "TOPLEFT" }, "text": "Incorrect end of HTML sequence", "orig": "Incorrect end of HTML sequence", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 21, "label": "text", "bbox": { "l": 283.0, "t": 617.4, "r": 398.1, "b": 623.3, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 11, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 283.0, "r_y0": 623.3, "r_x1": 398.1, "r_y1": 623.3, "r_x2": 398.1, "r_y2": 617.4, "r_x3": 283.0, "r_y3": 617.4, "coord_origin": "TOPLEFT" }, "text": "Horizontally merged cells are not present", "orig": "Horizontally merged cells are not present", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 22, "label": "text", "bbox": { "l": 293.6, "t": 465.6, "r": 437.5, "b": 471.5, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 12, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 293.6, "r_y0": 471.5, "r_x1": 437.5, "r_y1": 471.5, "r_x2": 437.5, "r_y2": 465.6, "r_x3": 293.6, "r_y3": 465.6, "coord_origin": "TOPLEFT" }, "text": "Repeating pattern is well represented in predictions", "orig": "Repeating pattern is well represented in predictions", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 23, "label": "text", "bbox": { "l": 181.9, "t": 288.4, "r": 239.2, "b": 294.3, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 13, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 181.9, "r_y0": 294.3, "r_x1": 239.2, "r_y1": 294.3, "r_x2": 239.2, "r_y2": 288.4, "r_x3": 181.9, "r_y3": 288.4, "coord_origin": "TOPLEFT" }, "text": "Repeating pattern of", "orig": "Repeating pattern of", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 24, "label": "text", "bbox": { "l": 181.9, "t": 294.9, "r": 251.5, "b": 300.8, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 14, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 181.9, "r_y0": 300.8, "r_x1": 251.5, "r_y1": 300.8, "r_x2": 251.5, "r_y2": 294.9, "r_x3": 181.9, "r_y3": 294.9, "coord_origin": "TOPLEFT" }, "text": "horizontally merged cells", "orig": "horizontally merged cells", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 25, "label": "text", "bbox": { "l": 247.8, "t": 184.8, "r": 253.6, "b": 194.8, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 15, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 247.8, "r_y0": 194.8, "r_x1": 253.6, "r_y1": 194.8, "r_x2": 253.6, "r_y2": 184.8, "r_x3": 247.8, "r_y3": 184.8, "coord_origin": "TOPLEFT" }, "text": "A", "orig": "A", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 26, "label": "text", "bbox": { "l": 292.2, "t": 607.8, "r": 381.5, "b": 613.7, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 16, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 292.2, "r_y0": 613.7, "r_x1": 381.5, "r_y1": 613.7, "r_x2": 381.5, "r_y2": 607.8, "r_x3": 292.2, "r_y3": 607.8, "coord_origin": "TOPLEFT" }, "text": "Bounding box drifting at the end", "orig": "Bounding box drifting at the end", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 27, "label": "text", "bbox": { "l": 172.3, "t": 381.4, "r": 180.2, "b": 403.4, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 17, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 172.3, "r_y0": 403.4, "r_x1": 180.2, "r_y1": 403.4, "r_x2": 180.2, "r_y2": 381.4, "r_x3": 172.3, "r_y3": 381.4, "coord_origin": "TOPLEFT" }, "text": "OTSL", "orig": "OTSL", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 28, "label": "text", "bbox": { "l": 172.3, "t": 555.8, "r": 180.2, "b": 578.7, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 18, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 172.3, "r_y0": 578.7, "r_x1": 180.2, "r_y1": 578.7, "r_x2": 180.2, "r_y2": 555.8, "r_x3": 172.3, "r_y3": 555.8, "coord_origin": "TOPLEFT" }, "text": "HTML", "orig": "HTML", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] } ] } ] }, "tablestructure": { "table_map": {} }, "figures_classification": null, "equations_prediction": null, "vlm_response": null }, "assembled": { "elements": [ { "label": "page_header", "id": 0, "page_no": 10, "cluster": { "id": 0, "label": "page_header", "bbox": { "l": 194.5, "t": 93.8, "r": 447.5, "b": 101.8, "coord_origin": "TOPLEFT" }, "confidence": 0.93, "cells": [ { "index": 0, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 194.5, "r_y0": 101.8, "r_x1": 447.5, "r_y1": 101.8, "r_x2": 447.5, "r_y2": 93.8, "r_x3": 194.5, "r_y3": 93.8, "coord_origin": "TOPLEFT" }, "text": "Optimized Table Tokenization for Table Structure Recognition", "orig": "Optimized Table Tokenization for Table Structure Recognition", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, "text": "Optimized Table Tokenization for Table Structure Recognition" }, { "label": "page_header", "id": 1, "page_no": 10, "cluster": { "id": 1, "label": "page_header", "bbox": { "l": 471.4, "t": 93.8, "r": 480.6, "b": 101.8, "coord_origin": "TOPLEFT" }, "confidence": 0.9, "cells": [ { "index": 1, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 471.4, "r_y0": 101.8, "r_x1": 480.6, "r_y1": 101.8, "r_x2": 480.6, "r_y2": 93.8, "r_x3": 471.4, "r_y3": 93.8, "coord_origin": "TOPLEFT" }, "text": "11", "orig": "11", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, "text": "11" }, { "label": "caption", "id": 2, "page_no": 10, "cluster": { "id": 2, "label": "caption", "bbox": { "l": 134.8, "t": 125.8, "r": 480.6, "b": 177.8, "coord_origin": "TOPLEFT" }, "confidence": 0.87, "cells": [ { "index": 2, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 134.8, "r_y0": 133.7, "r_x1": 162.6, "r_y1": 133.7, "r_x2": 162.6, "r_y2": 125.8, "r_x3": 134.8, "r_y3": 125.8, "coord_origin": "TOPLEFT" }, "text": "Fig. 6.", "orig": "Fig. 6.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 3, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 165.2, "r_y0": 133.9, "r_x1": 480.6, "r_y1": 133.9, "r_x2": 480.6, "r_y2": 125.9, "r_x3": 165.2, "r_y3": 125.9, "coord_origin": "TOPLEFT" }, "text": "Visualization of predicted structure and detected bounding boxes on a complex", "orig": "Visualization of predicted structure and detected bounding boxes on a complex", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 4, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 134.8, "r_y0": 144.9, "r_x1": 480.6, "r_y1": 144.9, "r_x2": 480.6, "r_y2": 136.8, "r_x3": 134.8, "r_y3": 136.8, "coord_origin": "TOPLEFT" }, "text": "table with many rows. The OTSL model (B) captured repeating pattern of horizontally", "orig": "table with many rows. The OTSL model (B) captured repeating pattern of horizontally", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 5, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 134.8, "r_y0": 155.8, "r_x1": 480.6, "r_y1": 155.8, "r_x2": 480.6, "r_y2": 147.8, "r_x3": 134.8, "r_y3": 147.8, "coord_origin": "TOPLEFT" }, "text": "merged cells from the GT (A), unlike the HTML model (C). The HTML model also", "orig": "merged cells from the GT (A), unlike the HTML model (C). The HTML model also", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 6, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 134.8, "r_y0": 166.8, "r_x1": 480.6, "r_y1": 166.8, "r_x2": 480.6, "r_y2": 158.7, "r_x3": 134.8, "r_y3": 158.7, "coord_origin": "TOPLEFT" }, "text": "didn\u2019t complete the HTML sequence correctly and displayed a lot more of drift and", "orig": "didn\u2019t complete the HTML sequence correctly and displayed a lot more of drift and", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 7, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 134.8, "r_y0": 177.8, "r_x1": 415.8, "r_y1": 177.8, "r_x2": 415.8, "r_y2": 169.7, "r_x3": 134.8, "r_y3": 169.7, "coord_origin": "TOPLEFT" }, "text": "overlap of bounding boxes. \"PMC5406406_003_01.png\" PubTabNet.", "orig": "overlap of bounding boxes. \"PMC5406406_003_01.png\" PubTabNet.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, "text": "Fig. 6. Visualization of predicted structure and detected bounding boxes on a complex table with many rows. The OTSL model (B) captured repeating pattern of horizontally merged cells from the GT (A), unlike the HTML model (C). The HTML model also didn't complete the HTML sequence correctly and displayed a lot more of drift and overlap of bounding boxes. \"PMC5406406_003_01.png\" PubTabNet." }, { "label": "picture", "id": 3, "page_no": 10, "cluster": { "id": 3, "label": "picture", "bbox": { "l": 168.4, "t": 182.0, "r": 447.4, "b": 634.0, "coord_origin": "TOPLEFT" }, "confidence": 0.76, "cells": [ { "index": 8, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 171.5, "r_y0": 320.4, "r_x1": 177.6, "r_y1": 320.4, "r_x2": 177.6, "r_y2": 312.5, "r_x3": 171.5, "r_y3": 312.5, "coord_origin": "TOPLEFT" }, "text": "B", "orig": "B", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 9, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 171.1, "r_y0": 500.6, "r_x1": 177.1, "r_y1": 500.6, "r_x2": 177.1, "r_y2": 492.7, "r_x3": 171.1, "r_y3": 492.7, "coord_origin": "TOPLEFT" }, "text": "C", "orig": "C", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 10, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 283.0, "r_y0": 633.4, "r_x1": 375.0, "r_y1": 633.4, "r_x2": 375.0, "r_y2": 627.5, "r_x3": 283.0, "r_y3": 627.5, "coord_origin": "TOPLEFT" }, "text": "Incorrect end of HTML sequence", "orig": "Incorrect end of HTML sequence", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 11, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 283.0, "r_y0": 623.3, "r_x1": 398.1, "r_y1": 623.3, "r_x2": 398.1, "r_y2": 617.4, "r_x3": 283.0, "r_y3": 617.4, "coord_origin": "TOPLEFT" }, "text": "Horizontally merged cells are not present", "orig": "Horizontally merged cells are not present", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 12, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 293.6, "r_y0": 471.5, "r_x1": 437.5, "r_y1": 471.5, "r_x2": 437.5, "r_y2": 465.6, "r_x3": 293.6, "r_y3": 465.6, "coord_origin": "TOPLEFT" }, "text": "Repeating pattern is well represented in predictions", "orig": "Repeating pattern is well represented in predictions", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 13, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 181.9, "r_y0": 294.3, "r_x1": 239.2, "r_y1": 294.3, "r_x2": 239.2, "r_y2": 288.4, "r_x3": 181.9, "r_y3": 288.4, "coord_origin": "TOPLEFT" }, "text": "Repeating pattern of", "orig": "Repeating pattern of", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 14, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 181.9, "r_y0": 300.8, "r_x1": 251.5, "r_y1": 300.8, "r_x2": 251.5, "r_y2": 294.9, "r_x3": 181.9, "r_y3": 294.9, "coord_origin": "TOPLEFT" }, "text": "horizontally merged cells", "orig": "horizontally merged cells", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 15, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 247.8, "r_y0": 194.8, "r_x1": 253.6, "r_y1": 194.8, "r_x2": 253.6, "r_y2": 184.8, "r_x3": 247.8, "r_y3": 184.8, "coord_origin": "TOPLEFT" }, "text": "A", "orig": "A", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 16, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 292.2, "r_y0": 613.7, "r_x1": 381.5, "r_y1": 613.7, "r_x2": 381.5, "r_y2": 607.8, "r_x3": 292.2, "r_y3": 607.8, "coord_origin": "TOPLEFT" }, "text": "Bounding box drifting at the end", "orig": "Bounding box drifting at the end", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 17, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 172.3, "r_y0": 403.4, "r_x1": 180.2, "r_y1": 403.4, "r_x2": 180.2, "r_y2": 381.4, "r_x3": 172.3, "r_y3": 381.4, "coord_origin": "TOPLEFT" }, "text": "OTSL", "orig": "OTSL", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 18, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 172.3, "r_y0": 578.7, "r_x1": 180.2, "r_y1": 578.7, "r_x2": 180.2, "r_y2": 555.8, "r_x3": 172.3, "r_y3": 555.8, "coord_origin": "TOPLEFT" }, "text": "HTML", "orig": "HTML", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [ { "id": 18, "label": "text", "bbox": { "l": 171.5, "t": 312.5, "r": 177.6, "b": 320.4, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 8, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 171.5, "r_y0": 320.4, "r_x1": 177.6, "r_y1": 320.4, "r_x2": 177.6, "r_y2": 312.5, "r_x3": 171.5, "r_y3": 312.5, "coord_origin": "TOPLEFT" }, "text": "B", "orig": "B", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 19, "label": "text", "bbox": { "l": 171.1, "t": 492.7, "r": 177.1, "b": 500.6, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 9, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 171.1, "r_y0": 500.6, "r_x1": 177.1, "r_y1": 500.6, "r_x2": 177.1, "r_y2": 492.7, "r_x3": 171.1, "r_y3": 492.7, "coord_origin": "TOPLEFT" }, "text": "C", "orig": "C", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 20, "label": "text", "bbox": { "l": 283.0, "t": 627.5, "r": 375.0, "b": 633.4, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 10, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 283.0, "r_y0": 633.4, "r_x1": 375.0, "r_y1": 633.4, "r_x2": 375.0, "r_y2": 627.5, "r_x3": 283.0, "r_y3": 627.5, "coord_origin": "TOPLEFT" }, "text": "Incorrect end of HTML sequence", "orig": "Incorrect end of HTML sequence", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 21, "label": "text", "bbox": { "l": 283.0, "t": 617.4, "r": 398.1, "b": 623.3, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 11, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 283.0, "r_y0": 623.3, "r_x1": 398.1, "r_y1": 623.3, "r_x2": 398.1, "r_y2": 617.4, "r_x3": 283.0, "r_y3": 617.4, "coord_origin": "TOPLEFT" }, "text": "Horizontally merged cells are not present", "orig": "Horizontally merged cells are not present", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 22, "label": "text", "bbox": { "l": 293.6, "t": 465.6, "r": 437.5, "b": 471.5, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 12, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 293.6, "r_y0": 471.5, "r_x1": 437.5, "r_y1": 471.5, "r_x2": 437.5, "r_y2": 465.6, "r_x3": 293.6, "r_y3": 465.6, "coord_origin": "TOPLEFT" }, "text": "Repeating pattern is well represented in predictions", "orig": "Repeating pattern is well represented in predictions", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 23, "label": "text", "bbox": { "l": 181.9, "t": 288.4, "r": 239.2, "b": 294.3, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 13, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 181.9, "r_y0": 294.3, "r_x1": 239.2, "r_y1": 294.3, "r_x2": 239.2, "r_y2": 288.4, "r_x3": 181.9, "r_y3": 288.4, "coord_origin": "TOPLEFT" }, "text": "Repeating pattern of", "orig": "Repeating pattern of", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 24, "label": "text", "bbox": { "l": 181.9, "t": 294.9, "r": 251.5, "b": 300.8, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 14, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 181.9, "r_y0": 300.8, "r_x1": 251.5, "r_y1": 300.8, "r_x2": 251.5, "r_y2": 294.9, "r_x3": 181.9, "r_y3": 294.9, "coord_origin": "TOPLEFT" }, "text": "horizontally merged cells", "orig": "horizontally merged cells", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 25, "label": "text", "bbox": { "l": 247.8, "t": 184.8, "r": 253.6, "b": 194.8, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 15, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 247.8, "r_y0": 194.8, "r_x1": 253.6, "r_y1": 194.8, "r_x2": 253.6, "r_y2": 184.8, "r_x3": 247.8, "r_y3": 184.8, "coord_origin": "TOPLEFT" }, "text": "A", "orig": "A", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 26, "label": "text", "bbox": { "l": 292.2, "t": 607.8, "r": 381.5, "b": 613.7, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 16, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 292.2, "r_y0": 613.7, "r_x1": 381.5, "r_y1": 613.7, "r_x2": 381.5, "r_y2": 607.8, "r_x3": 292.2, "r_y3": 607.8, "coord_origin": "TOPLEFT" }, "text": "Bounding box drifting at the end", "orig": "Bounding box drifting at the end", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 27, "label": "text", "bbox": { "l": 172.3, "t": 381.4, "r": 180.2, "b": 403.4, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 17, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 172.3, "r_y0": 403.4, "r_x1": 180.2, "r_y1": 403.4, "r_x2": 180.2, "r_y2": 381.4, "r_x3": 172.3, "r_y3": 381.4, "coord_origin": "TOPLEFT" }, "text": "OTSL", "orig": "OTSL", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 28, "label": "text", "bbox": { "l": 172.3, "t": 555.8, "r": 180.2, "b": 578.7, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 18, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 172.3, "r_y0": 578.7, "r_x1": 180.2, "r_y1": 578.7, "r_x2": 180.2, "r_y2": 555.8, "r_x3": 172.3, "r_y3": 555.8, "coord_origin": "TOPLEFT" }, "text": "HTML", "orig": "HTML", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] } ] }, "text": "", "annotations": [], "provenance": null, "predicted_class": null, "confidence": null } ], "body": [ { "label": "caption", "id": 2, "page_no": 10, "cluster": { "id": 2, "label": "caption", "bbox": { "l": 134.8, "t": 125.8, "r": 480.6, "b": 177.8, "coord_origin": "TOPLEFT" }, "confidence": 0.87, "cells": [ { "index": 2, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 134.8, "r_y0": 133.7, "r_x1": 162.6, "r_y1": 133.7, "r_x2": 162.6, "r_y2": 125.8, "r_x3": 134.8, "r_y3": 125.8, "coord_origin": "TOPLEFT" }, "text": "Fig. 6.", "orig": "Fig. 6.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 3, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 165.2, "r_y0": 133.9, "r_x1": 480.6, "r_y1": 133.9, "r_x2": 480.6, "r_y2": 125.9, "r_x3": 165.2, "r_y3": 125.9, "coord_origin": "TOPLEFT" }, "text": "Visualization of predicted structure and detected bounding boxes on a complex", "orig": "Visualization of predicted structure and detected bounding boxes on a complex", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 4, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 134.8, "r_y0": 144.9, "r_x1": 480.6, "r_y1": 144.9, "r_x2": 480.6, "r_y2": 136.8, "r_x3": 134.8, "r_y3": 136.8, "coord_origin": "TOPLEFT" }, "text": "table with many rows. The OTSL model (B) captured repeating pattern of horizontally", "orig": "table with many rows. The OTSL model (B) captured repeating pattern of horizontally", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 5, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 134.8, "r_y0": 155.8, "r_x1": 480.6, "r_y1": 155.8, "r_x2": 480.6, "r_y2": 147.8, "r_x3": 134.8, "r_y3": 147.8, "coord_origin": "TOPLEFT" }, "text": "merged cells from the GT (A), unlike the HTML model (C). The HTML model also", "orig": "merged cells from the GT (A), unlike the HTML model (C). The HTML model also", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 6, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 134.8, "r_y0": 166.8, "r_x1": 480.6, "r_y1": 166.8, "r_x2": 480.6, "r_y2": 158.7, "r_x3": 134.8, "r_y3": 158.7, "coord_origin": "TOPLEFT" }, "text": "didn\u2019t complete the HTML sequence correctly and displayed a lot more of drift and", "orig": "didn\u2019t complete the HTML sequence correctly and displayed a lot more of drift and", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 7, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 134.8, "r_y0": 177.8, "r_x1": 415.8, "r_y1": 177.8, "r_x2": 415.8, "r_y2": 169.7, "r_x3": 134.8, "r_y3": 169.7, "coord_origin": "TOPLEFT" }, "text": "overlap of bounding boxes. \"PMC5406406_003_01.png\" PubTabNet.", "orig": "overlap of bounding boxes. \"PMC5406406_003_01.png\" PubTabNet.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, "text": "Fig. 6. Visualization of predicted structure and detected bounding boxes on a complex table with many rows. The OTSL model (B) captured repeating pattern of horizontally merged cells from the GT (A), unlike the HTML model (C). The HTML model also didn't complete the HTML sequence correctly and displayed a lot more of drift and overlap of bounding boxes. \"PMC5406406_003_01.png\" PubTabNet." }, { "label": "picture", "id": 3, "page_no": 10, "cluster": { "id": 3, "label": "picture", "bbox": { "l": 168.4, "t": 182.0, "r": 447.4, "b": 634.0, "coord_origin": "TOPLEFT" }, "confidence": 0.76, "cells": [ { "index": 8, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 171.5, "r_y0": 320.4, "r_x1": 177.6, "r_y1": 320.4, "r_x2": 177.6, "r_y2": 312.5, "r_x3": 171.5, "r_y3": 312.5, "coord_origin": "TOPLEFT" }, "text": "B", "orig": "B", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 9, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 171.1, "r_y0": 500.6, "r_x1": 177.1, "r_y1": 500.6, "r_x2": 177.1, "r_y2": 492.7, "r_x3": 171.1, "r_y3": 492.7, "coord_origin": "TOPLEFT" }, "text": "C", "orig": "C", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 10, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 283.0, "r_y0": 633.4, "r_x1": 375.0, "r_y1": 633.4, "r_x2": 375.0, "r_y2": 627.5, "r_x3": 283.0, "r_y3": 627.5, "coord_origin": "TOPLEFT" }, "text": "Incorrect end of HTML sequence", "orig": "Incorrect end of HTML sequence", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 11, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 283.0, "r_y0": 623.3, "r_x1": 398.1, "r_y1": 623.3, "r_x2": 398.1, "r_y2": 617.4, "r_x3": 283.0, "r_y3": 617.4, "coord_origin": "TOPLEFT" }, "text": "Horizontally merged cells are not present", "orig": "Horizontally merged cells are not present", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 12, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 293.6, "r_y0": 471.5, "r_x1": 437.5, "r_y1": 471.5, "r_x2": 437.5, "r_y2": 465.6, "r_x3": 293.6, "r_y3": 465.6, "coord_origin": "TOPLEFT" }, "text": "Repeating pattern is well represented in predictions", "orig": "Repeating pattern is well represented in predictions", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 13, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 181.9, "r_y0": 294.3, "r_x1": 239.2, "r_y1": 294.3, "r_x2": 239.2, "r_y2": 288.4, "r_x3": 181.9, "r_y3": 288.4, "coord_origin": "TOPLEFT" }, "text": "Repeating pattern of", "orig": "Repeating pattern of", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 14, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 181.9, "r_y0": 300.8, "r_x1": 251.5, "r_y1": 300.8, "r_x2": 251.5, "r_y2": 294.9, "r_x3": 181.9, "r_y3": 294.9, "coord_origin": "TOPLEFT" }, "text": "horizontally merged cells", "orig": "horizontally merged cells", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 15, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 247.8, "r_y0": 194.8, "r_x1": 253.6, "r_y1": 194.8, "r_x2": 253.6, "r_y2": 184.8, "r_x3": 247.8, "r_y3": 184.8, "coord_origin": "TOPLEFT" }, "text": "A", "orig": "A", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 16, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 292.2, "r_y0": 613.7, "r_x1": 381.5, "r_y1": 613.7, "r_x2": 381.5, "r_y2": 607.8, "r_x3": 292.2, "r_y3": 607.8, "coord_origin": "TOPLEFT" }, "text": "Bounding box drifting at the end", "orig": "Bounding box drifting at the end", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 17, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 172.3, "r_y0": 403.4, "r_x1": 180.2, "r_y1": 403.4, "r_x2": 180.2, "r_y2": 381.4, "r_x3": 172.3, "r_y3": 381.4, "coord_origin": "TOPLEFT" }, "text": "OTSL", "orig": "OTSL", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 18, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 172.3, "r_y0": 578.7, "r_x1": 180.2, "r_y1": 578.7, "r_x2": 180.2, "r_y2": 555.8, "r_x3": 172.3, "r_y3": 555.8, "coord_origin": "TOPLEFT" }, "text": "HTML", "orig": "HTML", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [ { "id": 18, "label": "text", "bbox": { "l": 171.5, "t": 312.5, "r": 177.6, "b": 320.4, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 8, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 171.5, "r_y0": 320.4, "r_x1": 177.6, "r_y1": 320.4, "r_x2": 177.6, "r_y2": 312.5, "r_x3": 171.5, "r_y3": 312.5, "coord_origin": "TOPLEFT" }, "text": "B", "orig": "B", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 19, "label": "text", "bbox": { "l": 171.1, "t": 492.7, "r": 177.1, "b": 500.6, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 9, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 171.1, "r_y0": 500.6, "r_x1": 177.1, "r_y1": 500.6, "r_x2": 177.1, "r_y2": 492.7, "r_x3": 171.1, "r_y3": 492.7, "coord_origin": "TOPLEFT" }, "text": "C", "orig": "C", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 20, "label": "text", "bbox": { "l": 283.0, "t": 627.5, "r": 375.0, "b": 633.4, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 10, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 283.0, "r_y0": 633.4, "r_x1": 375.0, "r_y1": 633.4, "r_x2": 375.0, "r_y2": 627.5, "r_x3": 283.0, "r_y3": 627.5, "coord_origin": "TOPLEFT" }, "text": "Incorrect end of HTML sequence", "orig": "Incorrect end of HTML sequence", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 21, "label": "text", "bbox": { "l": 283.0, "t": 617.4, "r": 398.1, "b": 623.3, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 11, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 283.0, "r_y0": 623.3, "r_x1": 398.1, "r_y1": 623.3, "r_x2": 398.1, "r_y2": 617.4, "r_x3": 283.0, "r_y3": 617.4, "coord_origin": "TOPLEFT" }, "text": "Horizontally merged cells are not present", "orig": "Horizontally merged cells are not present", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 22, "label": "text", "bbox": { "l": 293.6, "t": 465.6, "r": 437.5, "b": 471.5, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 12, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 293.6, "r_y0": 471.5, "r_x1": 437.5, "r_y1": 471.5, "r_x2": 437.5, "r_y2": 465.6, "r_x3": 293.6, "r_y3": 465.6, "coord_origin": "TOPLEFT" }, "text": "Repeating pattern is well represented in predictions", "orig": "Repeating pattern is well represented in predictions", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 23, "label": "text", "bbox": { "l": 181.9, "t": 288.4, "r": 239.2, "b": 294.3, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 13, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 181.9, "r_y0": 294.3, "r_x1": 239.2, "r_y1": 294.3, "r_x2": 239.2, "r_y2": 288.4, "r_x3": 181.9, "r_y3": 288.4, "coord_origin": "TOPLEFT" }, "text": "Repeating pattern of", "orig": "Repeating pattern of", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 24, "label": "text", "bbox": { "l": 181.9, "t": 294.9, "r": 251.5, "b": 300.8, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 14, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 181.9, "r_y0": 300.8, "r_x1": 251.5, "r_y1": 300.8, "r_x2": 251.5, "r_y2": 294.9, "r_x3": 181.9, "r_y3": 294.9, "coord_origin": "TOPLEFT" }, "text": "horizontally merged cells", "orig": "horizontally merged cells", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 25, "label": "text", "bbox": { "l": 247.8, "t": 184.8, "r": 253.6, "b": 194.8, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 15, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 247.8, "r_y0": 194.8, "r_x1": 253.6, "r_y1": 194.8, "r_x2": 253.6, "r_y2": 184.8, "r_x3": 247.8, "r_y3": 184.8, "coord_origin": "TOPLEFT" }, "text": "A", "orig": "A", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 26, "label": "text", "bbox": { "l": 292.2, "t": 607.8, "r": 381.5, "b": 613.7, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 16, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 292.2, "r_y0": 613.7, "r_x1": 381.5, "r_y1": 613.7, "r_x2": 381.5, "r_y2": 607.8, "r_x3": 292.2, "r_y3": 607.8, "coord_origin": "TOPLEFT" }, "text": "Bounding box drifting at the end", "orig": "Bounding box drifting at the end", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 27, "label": "text", "bbox": { "l": 172.3, "t": 381.4, "r": 180.2, "b": 403.4, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 17, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 172.3, "r_y0": 403.4, "r_x1": 180.2, "r_y1": 403.4, "r_x2": 180.2, "r_y2": 381.4, "r_x3": 172.3, "r_y3": 381.4, "coord_origin": "TOPLEFT" }, "text": "OTSL", "orig": "OTSL", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 28, "label": "text", "bbox": { "l": 172.3, "t": 555.8, "r": 180.2, "b": 578.7, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 18, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 172.3, "r_y0": 578.7, "r_x1": 180.2, "r_y1": 578.7, "r_x2": 180.2, "r_y2": 555.8, "r_x3": 172.3, "r_y3": 555.8, "coord_origin": "TOPLEFT" }, "text": "HTML", "orig": "HTML", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] } ] }, "text": "", "annotations": [], "provenance": null, "predicted_class": null, "confidence": null } ], "headers": [ { "label": "page_header", "id": 0, "page_no": 10, "cluster": { "id": 0, "label": "page_header", "bbox": { "l": 194.5, "t": 93.8, "r": 447.5, "b": 101.8, "coord_origin": "TOPLEFT" }, "confidence": 0.93, "cells": [ { "index": 0, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 194.5, "r_y0": 101.8, "r_x1": 447.5, "r_y1": 101.8, "r_x2": 447.5, "r_y2": 93.8, "r_x3": 194.5, "r_y3": 93.8, "coord_origin": "TOPLEFT" }, "text": "Optimized Table Tokenization for Table Structure Recognition", "orig": "Optimized Table Tokenization for Table Structure Recognition", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, "text": "Optimized Table Tokenization for Table Structure Recognition" }, { "label": "page_header", "id": 1, "page_no": 10, "cluster": { "id": 1, "label": "page_header", "bbox": { "l": 471.4, "t": 93.8, "r": 480.6, "b": 101.8, "coord_origin": "TOPLEFT" }, "confidence": 0.9, "cells": [ { "index": 1, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 471.4, "r_y0": 101.8, "r_x1": 480.6, "r_y1": 101.8, "r_x2": 480.6, "r_y2": 93.8, "r_x3": 471.4, "r_y3": 93.8, "coord_origin": "TOPLEFT" }, "text": "11", "orig": "11", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, "text": "11" } ] } }, { "page_no": 11, "size": { "width": 612.0, "height": 792.0 }, "parsed_page": { "dimension": { "angle": 0.0, "rect": { "r_x0": 0.0, "r_y0": 0.0, "r_x1": 612.0, "r_y1": 0.0, "r_x2": 612.0, "r_y2": 792.0, "r_x3": 0.0, "r_y3": 792.0, "coord_origin": "BOTTOMLEFT" }, "boundary_type": "crop_box", "art_bbox": { "l": 0.0, "t": 792.0, "r": 612.0, "b": 0.0, "coord_origin": "BOTTOMLEFT" }, "bleed_bbox": { "l": 0.0, "t": 792.0, "r": 612.0, "b": 0.0, "coord_origin": "BOTTOMLEFT" }, "crop_bbox": { "l": 0.0, "t": 792.0, "r": 612.0, "b": 0.0, "coord_origin": "BOTTOMLEFT" }, "media_bbox": { "l": 0.0, "t": 792.0, "r": 612.0, "b": 0.0, "coord_origin": "BOTTOMLEFT" }, "trim_bbox": { "l": 0.0, "t": 792.0, "r": 612.0, "b": 0.0, "coord_origin": "BOTTOMLEFT" } }, "bitmap_resources": [], "char_cells": [], "word_cells": [], "textline_cells": [ { "index": 0, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 134.8, "r_y0": 101.8, "r_x1": 144.0, "r_y1": 101.8, "r_x2": 144.0, "r_y2": 93.8, "r_x3": 134.8, "r_y3": 93.8, "coord_origin": "TOPLEFT" }, "text": "12", "orig": "12", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 1, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 167.8, "r_y0": 101.8, "r_x1": 178.1, "r_y1": 101.8, "r_x2": 178.1, "r_y2": 93.8, "r_x3": 167.8, "r_y3": 93.8, "coord_origin": "TOPLEFT" }, "text": "M.", "orig": "M.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 2, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 182.4, "r_y0": 101.8, "r_x1": 231.7, "r_y1": 101.8, "r_x2": 231.7, "r_y2": 93.8, "r_x3": 182.4, "r_y3": 93.8, "coord_origin": "TOPLEFT" }, "text": "Lysak, et al.", "orig": "Lysak, et al.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 3, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 134.8, "r_y0": 128.1, "r_x1": 141.5, "r_y1": 128.1, "r_x2": 141.5, "r_y2": 117.5, "r_x3": 134.8, "r_y3": 117.5, "coord_origin": "TOPLEFT" }, "text": "6", "orig": "6", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 4, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 154.9, "r_y0": 128.1, "r_x1": 219.3, "r_y1": 128.1, "r_x2": 219.3, "r_y2": 117.5, "r_x3": 154.9, "r_y3": 117.5, "coord_origin": "TOPLEFT" }, "text": "Conclusion", "orig": "Conclusion", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 5, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 134.8, "r_y0": 155.7, "r_x1": 480.6, "r_y1": 155.7, "r_x2": 480.6, "r_y2": 146.9, "r_x3": 134.8, "r_y3": 146.9, "coord_origin": "TOPLEFT" }, "text": "We demonstrated that representing tables in HTML for the task of table struc-", "orig": "We demonstrated that representing tables in HTML for the task of table struc-", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 6, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 134.8, "r_y0": 167.6, "r_x1": 480.6, "r_y1": 167.6, "r_x2": 480.6, "r_y2": 158.8, "r_x3": 134.8, "r_y3": 158.8, "coord_origin": "TOPLEFT" }, "text": "ture recognition with Im2Seq models is ill-suited and has serious limitations.", "orig": "ture recognition with Im2Seq models is ill-suited and has serious limitations.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 7, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 134.8, "r_y0": 179.6, "r_x1": 480.6, "r_y1": 179.6, "r_x2": 480.6, "r_y2": 170.8, "r_x3": 134.8, "r_y3": 170.8, "coord_origin": "TOPLEFT" }, "text": "Furthermore, we presented in this paper an Optimized Table Structure Language", "orig": "Furthermore, we presented in this paper an Optimized Table Structure Language", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 8, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 134.8, "r_y0": 191.5, "r_x1": 480.6, "r_y1": 191.5, "r_x2": 480.6, "r_y2": 182.7, "r_x3": 134.8, "r_y3": 182.7, "coord_origin": "TOPLEFT" }, "text": "(OTSL) which, when compared to commonly used general purpose languages,", "orig": "(OTSL) which, when compared to commonly used general purpose languages,", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 9, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 134.8, "r_y0": 203.5, "r_x1": 239.5, "r_y1": 203.5, "r_x2": 239.5, "r_y2": 194.7, "r_x3": 134.8, "r_y3": 194.7, "coord_origin": "TOPLEFT" }, "text": "has several key benefits.", "orig": "has several key benefits.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 10, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 149.7, "r_y0": 216.2, "r_x1": 480.6, "r_y1": 216.2, "r_x2": 480.6, "r_y2": 207.4, "r_x3": 149.7, "r_y3": 207.4, "coord_origin": "TOPLEFT" }, "text": "First and foremost, given the same network configuration, inference time for", "orig": "First and foremost, given the same network configuration, inference time for", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 11, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 134.8, "r_y0": 228.2, "r_x1": 480.6, "r_y1": 228.2, "r_x2": 480.6, "r_y2": 219.4, "r_x3": 134.8, "r_y3": 219.4, "coord_origin": "TOPLEFT" }, "text": "a table-structure prediction is about 2 times faster compared to the conventional", "orig": "a table-structure prediction is about 2 times faster compared to the conventional", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 12, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 134.8, "r_y0": 240.2, "r_x1": 480.6, "r_y1": 240.2, "r_x2": 480.6, "r_y2": 231.4, "r_x3": 134.8, "r_y3": 231.4, "coord_origin": "TOPLEFT" }, "text": "HTML approach. This is primarily owed to the shorter sequence length of the", "orig": "HTML approach. This is primarily owed to the shorter sequence length of the", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 13, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 134.8, "r_y0": 252.1, "r_x1": 480.6, "r_y1": 252.1, "r_x2": 480.6, "r_y2": 243.3, "r_x3": 134.8, "r_y3": 243.3, "coord_origin": "TOPLEFT" }, "text": "OTSL representation. Additional performance benefits can be obtained with", "orig": "OTSL representation. Additional performance benefits can be obtained with", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 14, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 134.8, "r_y0": 264.1, "r_x1": 480.6, "r_y1": 264.1, "r_x2": 480.6, "r_y2": 255.3, "r_x3": 134.8, "r_y3": 255.3, "coord_origin": "TOPLEFT" }, "text": "HPO (hyper parameter optimization). As we demonstrate in our experiments,", "orig": "HPO (hyper parameter optimization). As we demonstrate in our experiments,", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 15, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 134.8, "r_y0": 276.0, "r_x1": 480.6, "r_y1": 276.0, "r_x2": 480.6, "r_y2": 267.2, "r_x3": 134.8, "r_y3": 267.2, "coord_origin": "TOPLEFT" }, "text": "models trained on OTSL can be significantly smaller, e.g. by reducing the number", "orig": "models trained on OTSL can be significantly smaller, e.g. by reducing the number", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 16, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 134.8, "r_y0": 288.0, "r_x1": 480.6, "r_y1": 288.0, "r_x2": 480.6, "r_y2": 279.2, "r_x3": 134.8, "r_y3": 279.2, "coord_origin": "TOPLEFT" }, "text": "of encoder and decoder layers, while preserving comparatively good prediction", "orig": "of encoder and decoder layers, while preserving comparatively good prediction", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 17, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 134.8, "r_y0": 299.9, "r_x1": 480.6, "r_y1": 299.9, "r_x2": 480.6, "r_y2": 291.1, "r_x3": 134.8, "r_y3": 291.1, "coord_origin": "TOPLEFT" }, "text": "quality. This can further improve inference performance, yielding 5-6 times faster", "orig": "quality. This can further improve inference performance, yielding 5-6 times faster", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 18, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 134.8, "r_y0": 311.9, "r_x1": 480.6, "r_y1": 311.9, "r_x2": 480.6, "r_y2": 303.1, "r_x3": 134.8, "r_y3": 303.1, "coord_origin": "TOPLEFT" }, "text": "inference speed in OTSL with prediction quality comparable to models trained", "orig": "inference speed in OTSL with prediction quality comparable to models trained", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 19, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 134.8, "r_y0": 323.8, "r_x1": 240.9, "r_y1": 323.8, "r_x2": 240.9, "r_y2": 315.0, "r_x3": 134.8, "r_y3": 315.0, "coord_origin": "TOPLEFT" }, "text": "on HTML (see Table 1).", "orig": "on HTML (see Table 1).", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 20, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 149.7, "r_y0": 336.6, "r_x1": 480.6, "r_y1": 336.6, "r_x2": 480.6, "r_y2": 327.8, "r_x3": 149.7, "r_y3": 327.8, "coord_origin": "TOPLEFT" }, "text": "Secondly, OTSL has more inherent structure and a significantly restricted vo-", "orig": "Secondly, OTSL has more inherent structure and a significantly restricted vo-", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 21, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 134.8, "r_y0": 348.6, "r_x1": 480.6, "r_y1": 348.6, "r_x2": 480.6, "r_y2": 339.8, "r_x3": 134.8, "r_y3": 339.8, "coord_origin": "TOPLEFT" }, "text": "cabulary size. This allows autoregressive models to perform better in the TED", "orig": "cabulary size. This allows autoregressive models to perform better in the TED", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 22, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 134.8, "r_y0": 360.5, "r_x1": 480.6, "r_y1": 360.5, "r_x2": 480.6, "r_y2": 351.7, "r_x3": 134.8, "r_y3": 351.7, "coord_origin": "TOPLEFT" }, "text": "metric, but especially with regards to prediction accuracy of the table-cell bound-", "orig": "metric, but especially with regards to prediction accuracy of the table-cell bound-", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 23, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 134.8, "r_y0": 372.5, "r_x1": 480.6, "r_y1": 372.5, "r_x2": 480.6, "r_y2": 363.7, "r_x3": 134.8, "r_y3": 363.7, "coord_origin": "TOPLEFT" }, "text": "ing boxes (see Table 2). As shown in Figure 5, we observe that the OTSL dras-", "orig": "ing boxes (see Table 2). As shown in Figure 5, we observe that the OTSL dras-", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 24, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 134.8, "r_y0": 384.4, "r_x1": 480.6, "r_y1": 384.4, "r_x2": 480.6, "r_y2": 375.6, "r_x3": 134.8, "r_y3": 375.6, "coord_origin": "TOPLEFT" }, "text": "tically reduces the drift for table cell bounding boxes at high row count and in", "orig": "tically reduces the drift for table cell bounding boxes at high row count and in", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 25, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 134.8, "r_y0": 396.4, "r_x1": 480.6, "r_y1": 396.4, "r_x2": 480.6, "r_y2": 387.6, "r_x3": 134.8, "r_y3": 387.6, "coord_origin": "TOPLEFT" }, "text": "sparse tables. This leads to more accurate predictions and a significant reduction", "orig": "sparse tables. This leads to more accurate predictions and a significant reduction", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 26, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 134.8, "r_y0": 408.3, "r_x1": 480.6, "r_y1": 408.3, "r_x2": 480.6, "r_y2": 399.5, "r_x3": 134.8, "r_y3": 399.5, "coord_origin": "TOPLEFT" }, "text": "in post-processing complexity, which is an undesired necessity in HTML-based", "orig": "in post-processing complexity, which is an undesired necessity in HTML-based", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 27, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 134.8, "r_y0": 420.3, "r_x1": 480.6, "r_y1": 420.3, "r_x2": 480.6, "r_y2": 411.5, "r_x3": 134.8, "r_y3": 411.5, "coord_origin": "TOPLEFT" }, "text": "Im2Seq models. Significant novelty lies in OTSL syntactical rules, which are few,", "orig": "Im2Seq models. Significant novelty lies in OTSL syntactical rules, which are few,", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 28, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 134.8, "r_y0": 432.2, "r_x1": 480.6, "r_y1": 432.2, "r_x2": 480.6, "r_y2": 423.4, "r_x3": 134.8, "r_y3": 423.4, "coord_origin": "TOPLEFT" }, "text": "simple and always backwards looking. Each new token can be validated only by", "orig": "simple and always backwards looking. Each new token can be validated only by", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 29, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 134.8, "r_y0": 444.2, "r_x1": 480.6, "r_y1": 444.2, "r_x2": 480.6, "r_y2": 435.4, "r_x3": 134.8, "r_y3": 435.4, "coord_origin": "TOPLEFT" }, "text": "analyzing the sequence of previous tokens, without requiring the entire sequence", "orig": "analyzing the sequence of previous tokens, without requiring the entire sequence", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 30, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 134.8, "r_y0": 456.1, "r_x1": 480.6, "r_y1": 456.1, "r_x2": 480.6, "r_y2": 447.4, "r_x3": 134.8, "r_y3": 447.4, "coord_origin": "TOPLEFT" }, "text": "to detect mistakes. This in return allows to perform structural error detection", "orig": "to detect mistakes. This in return allows to perform structural error detection", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 31, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 134.8, "r_y0": 468.1, "r_x1": 366.8, "r_y1": 468.1, "r_x2": 366.8, "r_y2": 459.3, "r_x3": 134.8, "r_y3": 459.3, "coord_origin": "TOPLEFT" }, "text": "and correction on-the-fly during sequence generation.", "orig": "and correction on-the-fly during sequence generation.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 32, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 134.8, "r_y0": 504.4, "r_x1": 197.7, "r_y1": 504.4, "r_x2": 197.7, "r_y2": 493.8, "r_x3": 134.8, "r_y3": 493.8, "coord_origin": "TOPLEFT" }, "text": "References", "orig": "References", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 33, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 139.4, "r_y0": 530.9, "r_x1": 146.5, "r_y1": 530.9, "r_x2": 146.5, "r_y2": 522.9, "r_x3": 139.4, "r_y3": 522.9, "coord_origin": "TOPLEFT" }, "text": "1.", "orig": "1.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 34, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 151.0, "r_y0": 530.9, "r_x1": 480.6, "r_y1": 530.9, "r_x2": 480.6, "r_y2": 522.9, "r_x3": 151.0, "r_y3": 522.9, "coord_origin": "TOPLEFT" }, "text": "Auer, C., Dolfi, M., Carvalho, A., Ramis, C.B., Staar, P.W.J.: Delivering doc-", "orig": "Auer, C., Dolfi, M., Carvalho, A., Ramis, C.B., Staar, P.W.J.: Delivering doc-", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 35, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 151.5, "r_y0": 541.9, "r_x1": 480.6, "r_y1": 541.9, "r_x2": 480.6, "r_y2": 533.8, "r_x3": 151.5, "r_y3": 533.8, "coord_origin": "TOPLEFT" }, "text": "ument conversion as a cloud service with high throughput and responsiveness.", "orig": "ument conversion as a cloud service with high throughput and responsiveness.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 36, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 151.5, "r_y0": 552.9, "r_x1": 176.3, "r_y1": 552.9, "r_x2": 176.3, "r_y2": 544.8, "r_x3": 151.5, "r_y3": 544.8, "coord_origin": "TOPLEFT" }, "text": "CoRR", "orig": "CoRR", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 37, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 179.5, "r_y0": 552.7, "r_x1": 250.7, "r_y1": 552.7, "r_x2": 250.7, "r_y2": 544.7, "r_x3": 179.5, "r_y3": 544.7, "coord_origin": "TOPLEFT" }, "text": "abs/2206.00785", "orig": "abs/2206.00785", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 38, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 253.8, "r_y0": 552.9, "r_x1": 282.0, "r_y1": 552.9, "r_x2": 282.0, "r_y2": 544.8, "r_x3": 253.8, "r_y3": 544.8, "coord_origin": "TOPLEFT" }, "text": "(2022).", "orig": "(2022).", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 39, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 285.1, "r_y0": 552.9, "r_x1": 478.0, "r_y1": 552.9, "r_x2": 478.0, "r_y2": 545.4, "r_x3": 285.1, "r_y3": 545.4, "coord_origin": "TOPLEFT" }, "text": "https://doi.org/10.48550/arXiv.2206.00785", "orig": "https://doi.org/10.48550/arXiv.2206.00785", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 40, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 478.0, "r_y0": 552.9, "r_x1": 480.6, "r_y1": 552.9, "r_x2": 480.6, "r_y2": 544.8, "r_x3": 478.0, "r_y3": 544.8, "coord_origin": "TOPLEFT" }, "text": ",", "orig": ",", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 41, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 151.5, "r_y0": 563.9, "r_x1": 344.5, "r_y1": 563.9, "r_x2": 344.5, "r_y2": 556.4, "r_x3": 151.5, "r_y3": 556.4, "coord_origin": "TOPLEFT" }, "text": "https://doi.org/10.48550/arXiv.2206.00785", "orig": "https://doi.org/10.48550/arXiv.2206.00785", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 42, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 139.4, "r_y0": 575.6, "r_x1": 145.9, "r_y1": 575.6, "r_x2": 145.9, "r_y2": 567.5, "r_x3": 139.4, "r_y3": 567.5, "coord_origin": "TOPLEFT" }, "text": "2.", "orig": "2.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 43, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 150.2, "r_y0": 575.6, "r_x1": 480.6, "r_y1": 575.6, "r_x2": 480.6, "r_y2": 567.5, "r_x3": 150.2, "r_y3": 567.5, "coord_origin": "TOPLEFT" }, "text": "Chen, B., Peng, D., Zhang, J., Ren, Y., Jin, L.: Complex table structure recognition", "orig": "Chen, B., Peng, D., Zhang, J., Ren, Y., Jin, L.: Complex table structure recognition", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 44, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 151.5, "r_y0": 586.5, "r_x1": 480.6, "r_y1": 586.5, "r_x2": 480.6, "r_y2": 578.5, "r_x3": 151.5, "r_y3": 578.5, "coord_origin": "TOPLEFT" }, "text": "in the wild using transformer and identity matrix-based augmentation. In: Porwal,", "orig": "in the wild using transformer and identity matrix-based augmentation. In: Porwal,", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 45, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 151.5, "r_y0": 597.5, "r_x1": 480.6, "r_y1": 597.5, "r_x2": 480.6, "r_y2": 589.4, "r_x3": 151.5, "r_y3": 589.4, "coord_origin": "TOPLEFT" }, "text": "U., Forn\u00e9s, A., Shafait, F. (eds.) Frontiers in Handwriting Recognition. pp. 545-", "orig": "U., Forn\u00e9s, A., Shafait, F. (eds.) Frontiers in Handwriting Recognition. pp. 545-", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 46, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 151.5, "r_y0": 608.5, "r_x1": 364.2, "r_y1": 608.5, "r_x2": 364.2, "r_y2": 600.4, "r_x3": 151.5, "r_y3": 600.4, "coord_origin": "TOPLEFT" }, "text": "561. Springer International Publishing, Cham (2022)", "orig": "561. Springer International Publishing, Cham (2022)", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 47, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 139.4, "r_y0": 620.2, "r_x1": 146.4, "r_y1": 620.2, "r_x2": 146.4, "r_y2": 612.2, "r_x3": 139.4, "r_y3": 612.2, "coord_origin": "TOPLEFT" }, "text": "3.", "orig": "3.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 48, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 151.0, "r_y0": 620.2, "r_x1": 480.6, "r_y1": 620.2, "r_x2": 480.6, "r_y2": 612.2, "r_x3": 151.0, "r_y3": 612.2, "coord_origin": "TOPLEFT" }, "text": "Chi, Z., Huang, H., Xu, H.D., Yu, H., Yin, W., Mao, X.L.: Complicated table", "orig": "Chi, Z., Huang, H., Xu, H.D., Yu, H., Yin, W., Mao, X.L.: Complicated table", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 49, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 151.5, "r_y0": 631.2, "r_x1": 400.2, "r_y1": 631.2, "r_x2": 400.2, "r_y2": 623.1, "r_x3": 151.5, "r_y3": 623.1, "coord_origin": "TOPLEFT" }, "text": "structure recognition. arXiv preprint arXiv:1908.04729 (2019)", "orig": "structure recognition. arXiv preprint arXiv:1908.04729 (2019)", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 50, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 139.4, "r_y0": 643.0, "r_x1": 146.5, "r_y1": 643.0, "r_x2": 146.5, "r_y2": 634.9, "r_x3": 139.4, "r_y3": 634.9, "coord_origin": "TOPLEFT" }, "text": "4.", "orig": "4.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 51, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 151.1, "r_y0": 643.0, "r_x1": 480.6, "r_y1": 643.0, "r_x2": 480.6, "r_y2": 634.9, "r_x3": 151.1, "r_y3": 634.9, "coord_origin": "TOPLEFT" }, "text": "Deng, Y., Rosenberg, D., Mann, G.: Challenges in end-to-end neural scientific", "orig": "Deng, Y., Rosenberg, D., Mann, G.: Challenges in end-to-end neural scientific", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 52, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 151.5, "r_y0": 653.9, "r_x1": 480.6, "r_y1": 653.9, "r_x2": 480.6, "r_y2": 645.8, "r_x3": 151.5, "r_y3": 645.8, "coord_origin": "TOPLEFT" }, "text": "table recognition. In: 2019 International Conference on Document Analysis and", "orig": "table recognition. In: 2019 International Conference on Document Analysis and", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 53, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 151.5, "r_y0": 664.9, "r_x1": 350.1, "r_y1": 664.9, "r_x2": 350.1, "r_y2": 656.8, "r_x3": 151.5, "r_y3": 656.8, "coord_origin": "TOPLEFT" }, "text": "Recognition (ICDAR). pp. 894-901. IEEE (2019)", "orig": "Recognition (ICDAR). pp. 894-901. IEEE (2019)", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "has_chars": false, "has_words": false, "has_lines": true, "image": null, "lines": [] }, "predictions": { "layout": { "clusters": [ { "id": 10, "label": "page_header", "bbox": { "l": 134.8, "t": 93.8, "r": 144.0, "b": 101.8, "coord_origin": "TOPLEFT" }, "confidence": 0.86, "cells": [ { "index": 0, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 134.8, "r_y0": 101.8, "r_x1": 144.0, "r_y1": 101.8, "r_x2": 144.0, "r_y2": 93.8, "r_x3": 134.8, "r_y3": 93.8, "coord_origin": "TOPLEFT" }, "text": "12", "orig": "12", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 9, "label": "page_header", "bbox": { "l": 167.8, "t": 93.8, "r": 231.7, "b": 101.8, "coord_origin": "TOPLEFT" }, "confidence": 0.89, "cells": [ { "index": 1, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 167.8, "r_y0": 101.8, "r_x1": 178.1, "r_y1": 101.8, "r_x2": 178.1, "r_y2": 93.8, "r_x3": 167.8, "r_y3": 93.8, "coord_origin": "TOPLEFT" }, "text": "M.", "orig": "M.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 2, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 182.4, "r_y0": 101.8, "r_x1": 231.7, "r_y1": 101.8, "r_x2": 231.7, "r_y2": 93.8, "r_x3": 182.4, "r_y3": 93.8, "coord_origin": "TOPLEFT" }, "text": "Lysak, et al.", "orig": "Lysak, et al.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 8, "label": "section_header", "bbox": { "l": 134.8, "t": 117.5, "r": 219.3, "b": 128.1, "coord_origin": "TOPLEFT" }, "confidence": 0.92, "cells": [ { "index": 3, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 134.8, "r_y0": 128.1, "r_x1": 141.5, "r_y1": 128.1, "r_x2": 141.5, "r_y2": 117.5, "r_x3": 134.8, "r_y3": 117.5, "coord_origin": "TOPLEFT" }, "text": "6", "orig": "6", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 4, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 154.9, "r_y0": 128.1, "r_x1": 219.3, "r_y1": 128.1, "r_x2": 219.3, "r_y2": 117.5, "r_x3": 154.9, "r_y3": 117.5, "coord_origin": "TOPLEFT" }, "text": "Conclusion", "orig": "Conclusion", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 2, "label": "text", "bbox": { "l": 134.8, "t": 146.9, "r": 480.6, "b": 203.5, "coord_origin": "TOPLEFT" }, "confidence": 0.98, "cells": [ { "index": 5, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 134.8, "r_y0": 155.7, "r_x1": 480.6, "r_y1": 155.7, "r_x2": 480.6, "r_y2": 146.9, "r_x3": 134.8, "r_y3": 146.9, "coord_origin": "TOPLEFT" }, "text": "We demonstrated that representing tables in HTML for the task of table struc-", "orig": "We demonstrated that representing tables in HTML for the task of table struc-", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 6, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 134.8, "r_y0": 167.6, "r_x1": 480.6, "r_y1": 167.6, "r_x2": 480.6, "r_y2": 158.8, "r_x3": 134.8, "r_y3": 158.8, "coord_origin": "TOPLEFT" }, "text": "ture recognition with Im2Seq models is ill-suited and has serious limitations.", "orig": "ture recognition with Im2Seq models is ill-suited and has serious limitations.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 7, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 134.8, "r_y0": 179.6, "r_x1": 480.6, "r_y1": 179.6, "r_x2": 480.6, "r_y2": 170.8, "r_x3": 134.8, "r_y3": 170.8, "coord_origin": "TOPLEFT" }, "text": "Furthermore, we presented in this paper an Optimized Table Structure Language", "orig": "Furthermore, we presented in this paper an Optimized Table Structure Language", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 8, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 134.8, "r_y0": 191.5, "r_x1": 480.6, "r_y1": 191.5, "r_x2": 480.6, "r_y2": 182.7, "r_x3": 134.8, "r_y3": 182.7, "coord_origin": "TOPLEFT" }, "text": "(OTSL) which, when compared to commonly used general purpose languages,", "orig": "(OTSL) which, when compared to commonly used general purpose languages,", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 9, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 134.8, "r_y0": 203.5, "r_x1": 239.5, "r_y1": 203.5, "r_x2": 239.5, "r_y2": 194.7, "r_x3": 134.8, "r_y3": 194.7, "coord_origin": "TOPLEFT" }, "text": "has several key benefits.", "orig": "has several key benefits.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 0, "label": "text", "bbox": { "l": 134.8, "t": 207.4, "r": 480.6, "b": 323.8, "coord_origin": "TOPLEFT" }, "confidence": 0.99, "cells": [ { "index": 10, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 149.7, "r_y0": 216.2, "r_x1": 480.6, "r_y1": 216.2, "r_x2": 480.6, "r_y2": 207.4, "r_x3": 149.7, "r_y3": 207.4, "coord_origin": "TOPLEFT" }, "text": "First and foremost, given the same network configuration, inference time for", "orig": "First and foremost, given the same network configuration, inference time for", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 11, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 134.8, "r_y0": 228.2, "r_x1": 480.6, "r_y1": 228.2, "r_x2": 480.6, "r_y2": 219.4, "r_x3": 134.8, "r_y3": 219.4, "coord_origin": "TOPLEFT" }, "text": "a table-structure prediction is about 2 times faster compared to the conventional", "orig": "a table-structure prediction is about 2 times faster compared to the conventional", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 12, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 134.8, "r_y0": 240.2, "r_x1": 480.6, "r_y1": 240.2, "r_x2": 480.6, "r_y2": 231.4, "r_x3": 134.8, "r_y3": 231.4, "coord_origin": "TOPLEFT" }, "text": "HTML approach. This is primarily owed to the shorter sequence length of the", "orig": "HTML approach. This is primarily owed to the shorter sequence length of the", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 13, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 134.8, "r_y0": 252.1, "r_x1": 480.6, "r_y1": 252.1, "r_x2": 480.6, "r_y2": 243.3, "r_x3": 134.8, "r_y3": 243.3, "coord_origin": "TOPLEFT" }, "text": "OTSL representation. Additional performance benefits can be obtained with", "orig": "OTSL representation. Additional performance benefits can be obtained with", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 14, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 134.8, "r_y0": 264.1, "r_x1": 480.6, "r_y1": 264.1, "r_x2": 480.6, "r_y2": 255.3, "r_x3": 134.8, "r_y3": 255.3, "coord_origin": "TOPLEFT" }, "text": "HPO (hyper parameter optimization). As we demonstrate in our experiments,", "orig": "HPO (hyper parameter optimization). As we demonstrate in our experiments,", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 15, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 134.8, "r_y0": 276.0, "r_x1": 480.6, "r_y1": 276.0, "r_x2": 480.6, "r_y2": 267.2, "r_x3": 134.8, "r_y3": 267.2, "coord_origin": "TOPLEFT" }, "text": "models trained on OTSL can be significantly smaller, e.g. by reducing the number", "orig": "models trained on OTSL can be significantly smaller, e.g. by reducing the number", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 16, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 134.8, "r_y0": 288.0, "r_x1": 480.6, "r_y1": 288.0, "r_x2": 480.6, "r_y2": 279.2, "r_x3": 134.8, "r_y3": 279.2, "coord_origin": "TOPLEFT" }, "text": "of encoder and decoder layers, while preserving comparatively good prediction", "orig": "of encoder and decoder layers, while preserving comparatively good prediction", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 17, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 134.8, "r_y0": 299.9, "r_x1": 480.6, "r_y1": 299.9, "r_x2": 480.6, "r_y2": 291.1, "r_x3": 134.8, "r_y3": 291.1, "coord_origin": "TOPLEFT" }, "text": "quality. This can further improve inference performance, yielding 5-6 times faster", "orig": "quality. This can further improve inference performance, yielding 5-6 times faster", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 18, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 134.8, "r_y0": 311.9, "r_x1": 480.6, "r_y1": 311.9, "r_x2": 480.6, "r_y2": 303.1, "r_x3": 134.8, "r_y3": 303.1, "coord_origin": "TOPLEFT" }, "text": "inference speed in OTSL with prediction quality comparable to models trained", "orig": "inference speed in OTSL with prediction quality comparable to models trained", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 19, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 134.8, "r_y0": 323.8, "r_x1": 240.9, "r_y1": 323.8, "r_x2": 240.9, "r_y2": 315.0, "r_x3": 134.8, "r_y3": 315.0, "coord_origin": "TOPLEFT" }, "text": "on HTML (see Table 1).", "orig": "on HTML (see Table 1).", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 1, "label": "text", "bbox": { "l": 134.8, "t": 327.8, "r": 480.6, "b": 468.1, "coord_origin": "TOPLEFT" }, "confidence": 0.99, "cells": [ { "index": 20, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 149.7, "r_y0": 336.6, "r_x1": 480.6, "r_y1": 336.6, "r_x2": 480.6, "r_y2": 327.8, "r_x3": 149.7, "r_y3": 327.8, "coord_origin": "TOPLEFT" }, "text": "Secondly, OTSL has more inherent structure and a significantly restricted vo-", "orig": "Secondly, OTSL has more inherent structure and a significantly restricted vo-", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 21, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 134.8, "r_y0": 348.6, "r_x1": 480.6, "r_y1": 348.6, "r_x2": 480.6, "r_y2": 339.8, "r_x3": 134.8, "r_y3": 339.8, "coord_origin": "TOPLEFT" }, "text": "cabulary size. This allows autoregressive models to perform better in the TED", "orig": "cabulary size. This allows autoregressive models to perform better in the TED", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 22, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 134.8, "r_y0": 360.5, "r_x1": 480.6, "r_y1": 360.5, "r_x2": 480.6, "r_y2": 351.7, "r_x3": 134.8, "r_y3": 351.7, "coord_origin": "TOPLEFT" }, "text": "metric, but especially with regards to prediction accuracy of the table-cell bound-", "orig": "metric, but especially with regards to prediction accuracy of the table-cell bound-", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 23, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 134.8, "r_y0": 372.5, "r_x1": 480.6, "r_y1": 372.5, "r_x2": 480.6, "r_y2": 363.7, "r_x3": 134.8, "r_y3": 363.7, "coord_origin": "TOPLEFT" }, "text": "ing boxes (see Table 2). As shown in Figure 5, we observe that the OTSL dras-", "orig": "ing boxes (see Table 2). As shown in Figure 5, we observe that the OTSL dras-", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 24, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 134.8, "r_y0": 384.4, "r_x1": 480.6, "r_y1": 384.4, "r_x2": 480.6, "r_y2": 375.6, "r_x3": 134.8, "r_y3": 375.6, "coord_origin": "TOPLEFT" }, "text": "tically reduces the drift for table cell bounding boxes at high row count and in", "orig": "tically reduces the drift for table cell bounding boxes at high row count and in", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 25, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 134.8, "r_y0": 396.4, "r_x1": 480.6, "r_y1": 396.4, "r_x2": 480.6, "r_y2": 387.6, "r_x3": 134.8, "r_y3": 387.6, "coord_origin": "TOPLEFT" }, "text": "sparse tables. This leads to more accurate predictions and a significant reduction", "orig": "sparse tables. This leads to more accurate predictions and a significant reduction", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 26, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 134.8, "r_y0": 408.3, "r_x1": 480.6, "r_y1": 408.3, "r_x2": 480.6, "r_y2": 399.5, "r_x3": 134.8, "r_y3": 399.5, "coord_origin": "TOPLEFT" }, "text": "in post-processing complexity, which is an undesired necessity in HTML-based", "orig": "in post-processing complexity, which is an undesired necessity in HTML-based", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 27, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 134.8, "r_y0": 420.3, "r_x1": 480.6, "r_y1": 420.3, "r_x2": 480.6, "r_y2": 411.5, "r_x3": 134.8, "r_y3": 411.5, "coord_origin": "TOPLEFT" }, "text": "Im2Seq models. Significant novelty lies in OTSL syntactical rules, which are few,", "orig": "Im2Seq models. Significant novelty lies in OTSL syntactical rules, which are few,", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 28, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 134.8, "r_y0": 432.2, "r_x1": 480.6, "r_y1": 432.2, "r_x2": 480.6, "r_y2": 423.4, "r_x3": 134.8, "r_y3": 423.4, "coord_origin": "TOPLEFT" }, "text": "simple and always backwards looking. Each new token can be validated only by", "orig": "simple and always backwards looking. Each new token can be validated only by", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 29, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 134.8, "r_y0": 444.2, "r_x1": 480.6, "r_y1": 444.2, "r_x2": 480.6, "r_y2": 435.4, "r_x3": 134.8, "r_y3": 435.4, "coord_origin": "TOPLEFT" }, "text": "analyzing the sequence of previous tokens, without requiring the entire sequence", "orig": "analyzing the sequence of previous tokens, without requiring the entire sequence", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 30, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 134.8, "r_y0": 456.1, "r_x1": 480.6, "r_y1": 456.1, "r_x2": 480.6, "r_y2": 447.4, "r_x3": 134.8, "r_y3": 447.4, "coord_origin": "TOPLEFT" }, "text": "to detect mistakes. This in return allows to perform structural error detection", "orig": "to detect mistakes. This in return allows to perform structural error detection", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 31, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 134.8, "r_y0": 468.1, "r_x1": 366.8, "r_y1": 468.1, "r_x2": 366.8, "r_y2": 459.3, "r_x3": 134.8, "r_y3": 459.3, "coord_origin": "TOPLEFT" }, "text": "and correction on-the-fly during sequence generation.", "orig": "and correction on-the-fly during sequence generation.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 7, "label": "section_header", "bbox": { "l": 134.8, "t": 493.8, "r": 197.7, "b": 504.4, "coord_origin": "TOPLEFT" }, "confidence": 0.94, "cells": [ { "index": 32, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 134.8, "r_y0": 504.4, "r_x1": 197.7, "r_y1": 504.4, "r_x2": 197.7, "r_y2": 493.8, "r_x3": 134.8, "r_y3": 493.8, "coord_origin": "TOPLEFT" }, "text": "References", "orig": "References", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 5, "label": "list_item", "bbox": { "l": 139.4, "t": 522.9, "r": 480.6, "b": 563.9, "coord_origin": "TOPLEFT" }, "confidence": 0.97, "cells": [ { "index": 33, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 139.4, "r_y0": 530.9, "r_x1": 146.5, "r_y1": 530.9, "r_x2": 146.5, "r_y2": 522.9, "r_x3": 139.4, "r_y3": 522.9, "coord_origin": "TOPLEFT" }, "text": "1.", "orig": "1.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 34, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 151.0, "r_y0": 530.9, "r_x1": 480.6, "r_y1": 530.9, "r_x2": 480.6, "r_y2": 522.9, "r_x3": 151.0, "r_y3": 522.9, "coord_origin": "TOPLEFT" }, "text": "Auer, C., Dolfi, M., Carvalho, A., Ramis, C.B., Staar, P.W.J.: Delivering doc-", "orig": "Auer, C., Dolfi, M., Carvalho, A., Ramis, C.B., Staar, P.W.J.: Delivering doc-", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 35, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 151.5, "r_y0": 541.9, "r_x1": 480.6, "r_y1": 541.9, "r_x2": 480.6, "r_y2": 533.8, "r_x3": 151.5, "r_y3": 533.8, "coord_origin": "TOPLEFT" }, "text": "ument conversion as a cloud service with high throughput and responsiveness.", "orig": "ument conversion as a cloud service with high throughput and responsiveness.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 36, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 151.5, "r_y0": 552.9, "r_x1": 176.3, "r_y1": 552.9, "r_x2": 176.3, "r_y2": 544.8, "r_x3": 151.5, "r_y3": 544.8, "coord_origin": "TOPLEFT" }, "text": "CoRR", "orig": "CoRR", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 37, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 179.5, "r_y0": 552.7, "r_x1": 250.7, "r_y1": 552.7, "r_x2": 250.7, "r_y2": 544.7, "r_x3": 179.5, "r_y3": 544.7, "coord_origin": "TOPLEFT" }, "text": "abs/2206.00785", "orig": "abs/2206.00785", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 38, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 253.8, "r_y0": 552.9, "r_x1": 282.0, "r_y1": 552.9, "r_x2": 282.0, "r_y2": 544.8, "r_x3": 253.8, "r_y3": 544.8, "coord_origin": "TOPLEFT" }, "text": "(2022).", "orig": "(2022).", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 39, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 285.1, "r_y0": 552.9, "r_x1": 478.0, "r_y1": 552.9, "r_x2": 478.0, "r_y2": 545.4, "r_x3": 285.1, "r_y3": 545.4, "coord_origin": "TOPLEFT" }, "text": "https://doi.org/10.48550/arXiv.2206.00785", "orig": "https://doi.org/10.48550/arXiv.2206.00785", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 40, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 478.0, "r_y0": 552.9, "r_x1": 480.6, "r_y1": 552.9, "r_x2": 480.6, "r_y2": 544.8, "r_x3": 478.0, "r_y3": 544.8, "coord_origin": "TOPLEFT" }, "text": ",", "orig": ",", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 41, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 151.5, "r_y0": 563.9, "r_x1": 344.5, "r_y1": 563.9, "r_x2": 344.5, "r_y2": 556.4, "r_x3": 151.5, "r_y3": 556.4, "coord_origin": "TOPLEFT" }, "text": "https://doi.org/10.48550/arXiv.2206.00785", "orig": "https://doi.org/10.48550/arXiv.2206.00785", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 4, "label": "list_item", "bbox": { "l": 139.4, "t": 567.5, "r": 480.6, "b": 608.5, "coord_origin": "TOPLEFT" }, "confidence": 0.97, "cells": [ { "index": 42, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 139.4, "r_y0": 575.6, "r_x1": 145.9, "r_y1": 575.6, "r_x2": 145.9, "r_y2": 567.5, "r_x3": 139.4, "r_y3": 567.5, "coord_origin": "TOPLEFT" }, "text": "2.", "orig": "2.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 43, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 150.2, "r_y0": 575.6, "r_x1": 480.6, "r_y1": 575.6, "r_x2": 480.6, "r_y2": 567.5, "r_x3": 150.2, "r_y3": 567.5, "coord_origin": "TOPLEFT" }, "text": "Chen, B., Peng, D., Zhang, J., Ren, Y., Jin, L.: Complex table structure recognition", "orig": "Chen, B., Peng, D., Zhang, J., Ren, Y., Jin, L.: Complex table structure recognition", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 44, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 151.5, "r_y0": 586.5, "r_x1": 480.6, "r_y1": 586.5, "r_x2": 480.6, "r_y2": 578.5, "r_x3": 151.5, "r_y3": 578.5, "coord_origin": "TOPLEFT" }, "text": "in the wild using transformer and identity matrix-based augmentation. In: Porwal,", "orig": "in the wild using transformer and identity matrix-based augmentation. In: Porwal,", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 45, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 151.5, "r_y0": 597.5, "r_x1": 480.6, "r_y1": 597.5, "r_x2": 480.6, "r_y2": 589.4, "r_x3": 151.5, "r_y3": 589.4, "coord_origin": "TOPLEFT" }, "text": "U., Forn\u00e9s, A., Shafait, F. (eds.) Frontiers in Handwriting Recognition. pp. 545-", "orig": "U., Forn\u00e9s, A., Shafait, F. (eds.) Frontiers in Handwriting Recognition. pp. 545-", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 46, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 151.5, "r_y0": 608.5, "r_x1": 364.2, "r_y1": 608.5, "r_x2": 364.2, "r_y2": 600.4, "r_x3": 151.5, "r_y3": 600.4, "coord_origin": "TOPLEFT" }, "text": "561. Springer International Publishing, Cham (2022)", "orig": "561. Springer International Publishing, Cham (2022)", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 6, "label": "list_item", "bbox": { "l": 139.4, "t": 612.2, "r": 480.6, "b": 631.2, "coord_origin": "TOPLEFT" }, "confidence": 0.96, "cells": [ { "index": 47, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 139.4, "r_y0": 620.2, "r_x1": 146.4, "r_y1": 620.2, "r_x2": 146.4, "r_y2": 612.2, "r_x3": 139.4, "r_y3": 612.2, "coord_origin": "TOPLEFT" }, "text": "3.", "orig": "3.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 48, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 151.0, "r_y0": 620.2, "r_x1": 480.6, "r_y1": 620.2, "r_x2": 480.6, "r_y2": 612.2, "r_x3": 151.0, "r_y3": 612.2, "coord_origin": "TOPLEFT" }, "text": "Chi, Z., Huang, H., Xu, H.D., Yu, H., Yin, W., Mao, X.L.: Complicated table", "orig": "Chi, Z., Huang, H., Xu, H.D., Yu, H., Yin, W., Mao, X.L.: Complicated table", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 49, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 151.5, "r_y0": 631.2, "r_x1": 400.2, "r_y1": 631.2, "r_x2": 400.2, "r_y2": 623.1, "r_x3": 151.5, "r_y3": 623.1, "coord_origin": "TOPLEFT" }, "text": "structure recognition. arXiv preprint arXiv:1908.04729 (2019)", "orig": "structure recognition. arXiv preprint arXiv:1908.04729 (2019)", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 3, "label": "list_item", "bbox": { "l": 139.4, "t": 634.9, "r": 480.6, "b": 664.9, "coord_origin": "TOPLEFT" }, "confidence": 0.98, "cells": [ { "index": 50, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 139.4, "r_y0": 643.0, "r_x1": 146.5, "r_y1": 643.0, "r_x2": 146.5, "r_y2": 634.9, "r_x3": 139.4, "r_y3": 634.9, "coord_origin": "TOPLEFT" }, "text": "4.", "orig": "4.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 51, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 151.1, "r_y0": 643.0, "r_x1": 480.6, "r_y1": 643.0, "r_x2": 480.6, "r_y2": 634.9, "r_x3": 151.1, "r_y3": 634.9, "coord_origin": "TOPLEFT" }, "text": "Deng, Y., Rosenberg, D., Mann, G.: Challenges in end-to-end neural scientific", "orig": "Deng, Y., Rosenberg, D., Mann, G.: Challenges in end-to-end neural scientific", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 52, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 151.5, "r_y0": 653.9, "r_x1": 480.6, "r_y1": 653.9, "r_x2": 480.6, "r_y2": 645.8, "r_x3": 151.5, "r_y3": 645.8, "coord_origin": "TOPLEFT" }, "text": "table recognition. In: 2019 International Conference on Document Analysis and", "orig": "table recognition. In: 2019 International Conference on Document Analysis and", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 53, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 151.5, "r_y0": 664.9, "r_x1": 350.1, "r_y1": 664.9, "r_x2": 350.1, "r_y2": 656.8, "r_x3": 151.5, "r_y3": 656.8, "coord_origin": "TOPLEFT" }, "text": "Recognition (ICDAR). pp. 894-901. IEEE (2019)", "orig": "Recognition (ICDAR). pp. 894-901. IEEE (2019)", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] } ] }, "tablestructure": { "table_map": {} }, "figures_classification": null, "equations_prediction": null, "vlm_response": null }, "assembled": { "elements": [ { "label": "page_header", "id": 10, "page_no": 11, "cluster": { "id": 10, "label": "page_header", "bbox": { "l": 134.8, "t": 93.8, "r": 144.0, "b": 101.8, "coord_origin": "TOPLEFT" }, "confidence": 0.86, "cells": [ { "index": 0, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 134.8, "r_y0": 101.8, "r_x1": 144.0, "r_y1": 101.8, "r_x2": 144.0, "r_y2": 93.8, "r_x3": 134.8, "r_y3": 93.8, "coord_origin": "TOPLEFT" }, "text": "12", "orig": "12", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, "text": "12" }, { "label": "page_header", "id": 9, "page_no": 11, "cluster": { "id": 9, "label": "page_header", "bbox": { "l": 167.8, "t": 93.8, "r": 231.7, "b": 101.8, "coord_origin": "TOPLEFT" }, "confidence": 0.89, "cells": [ { "index": 1, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 167.8, "r_y0": 101.8, "r_x1": 178.1, "r_y1": 101.8, "r_x2": 178.1, "r_y2": 93.8, "r_x3": 167.8, "r_y3": 93.8, "coord_origin": "TOPLEFT" }, "text": "M.", "orig": "M.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 2, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 182.4, "r_y0": 101.8, "r_x1": 231.7, "r_y1": 101.8, "r_x2": 231.7, "r_y2": 93.8, "r_x3": 182.4, "r_y3": 93.8, "coord_origin": "TOPLEFT" }, "text": "Lysak, et al.", "orig": "Lysak, et al.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, "text": "M. Lysak, et al." }, { "label": "section_header", "id": 8, "page_no": 11, "cluster": { "id": 8, "label": "section_header", "bbox": { "l": 134.8, "t": 117.5, "r": 219.3, "b": 128.1, "coord_origin": "TOPLEFT" }, "confidence": 0.92, "cells": [ { "index": 3, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 134.8, "r_y0": 128.1, "r_x1": 141.5, "r_y1": 128.1, "r_x2": 141.5, "r_y2": 117.5, "r_x3": 134.8, "r_y3": 117.5, "coord_origin": "TOPLEFT" }, "text": "6", "orig": "6", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 4, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 154.9, "r_y0": 128.1, "r_x1": 219.3, "r_y1": 128.1, "r_x2": 219.3, "r_y2": 117.5, "r_x3": 154.9, "r_y3": 117.5, "coord_origin": "TOPLEFT" }, "text": "Conclusion", "orig": "Conclusion", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, "text": "6 Conclusion" }, { "label": "text", "id": 2, "page_no": 11, "cluster": { "id": 2, "label": "text", "bbox": { "l": 134.8, "t": 146.9, "r": 480.6, "b": 203.5, "coord_origin": "TOPLEFT" }, "confidence": 0.98, "cells": [ { "index": 5, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 134.8, "r_y0": 155.7, "r_x1": 480.6, "r_y1": 155.7, "r_x2": 480.6, "r_y2": 146.9, "r_x3": 134.8, "r_y3": 146.9, "coord_origin": "TOPLEFT" }, "text": "We demonstrated that representing tables in HTML for the task of table struc-", "orig": "We demonstrated that representing tables in HTML for the task of table struc-", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 6, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 134.8, "r_y0": 167.6, "r_x1": 480.6, "r_y1": 167.6, "r_x2": 480.6, "r_y2": 158.8, "r_x3": 134.8, "r_y3": 158.8, "coord_origin": "TOPLEFT" }, "text": "ture recognition with Im2Seq models is ill-suited and has serious limitations.", "orig": "ture recognition with Im2Seq models is ill-suited and has serious limitations.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 7, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 134.8, "r_y0": 179.6, "r_x1": 480.6, "r_y1": 179.6, "r_x2": 480.6, "r_y2": 170.8, "r_x3": 134.8, "r_y3": 170.8, "coord_origin": "TOPLEFT" }, "text": "Furthermore, we presented in this paper an Optimized Table Structure Language", "orig": "Furthermore, we presented in this paper an Optimized Table Structure Language", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 8, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 134.8, "r_y0": 191.5, "r_x1": 480.6, "r_y1": 191.5, "r_x2": 480.6, "r_y2": 182.7, "r_x3": 134.8, "r_y3": 182.7, "coord_origin": "TOPLEFT" }, "text": "(OTSL) which, when compared to commonly used general purpose languages,", "orig": "(OTSL) which, when compared to commonly used general purpose languages,", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 9, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 134.8, "r_y0": 203.5, "r_x1": 239.5, "r_y1": 203.5, "r_x2": 239.5, "r_y2": 194.7, "r_x3": 134.8, "r_y3": 194.7, "coord_origin": "TOPLEFT" }, "text": "has several key benefits.", "orig": "has several key benefits.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, "text": "We demonstrated that representing tables in HTML for the task of table structure recognition with Im2Seq models is ill-suited and has serious limitations. Furthermore, we presented in this paper an Optimized Table Structure Language (OTSL) which, when compared to commonly used general purpose languages, has several key benefits." }, { "label": "text", "id": 0, "page_no": 11, "cluster": { "id": 0, "label": "text", "bbox": { "l": 134.8, "t": 207.4, "r": 480.6, "b": 323.8, "coord_origin": "TOPLEFT" }, "confidence": 0.99, "cells": [ { "index": 10, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 149.7, "r_y0": 216.2, "r_x1": 480.6, "r_y1": 216.2, "r_x2": 480.6, "r_y2": 207.4, "r_x3": 149.7, "r_y3": 207.4, "coord_origin": "TOPLEFT" }, "text": "First and foremost, given the same network configuration, inference time for", "orig": "First and foremost, given the same network configuration, inference time for", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 11, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 134.8, "r_y0": 228.2, "r_x1": 480.6, "r_y1": 228.2, "r_x2": 480.6, "r_y2": 219.4, "r_x3": 134.8, "r_y3": 219.4, "coord_origin": "TOPLEFT" }, "text": "a table-structure prediction is about 2 times faster compared to the conventional", "orig": "a table-structure prediction is about 2 times faster compared to the conventional", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 12, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 134.8, "r_y0": 240.2, "r_x1": 480.6, "r_y1": 240.2, "r_x2": 480.6, "r_y2": 231.4, "r_x3": 134.8, "r_y3": 231.4, "coord_origin": "TOPLEFT" }, "text": "HTML approach. This is primarily owed to the shorter sequence length of the", "orig": "HTML approach. This is primarily owed to the shorter sequence length of the", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 13, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 134.8, "r_y0": 252.1, "r_x1": 480.6, "r_y1": 252.1, "r_x2": 480.6, "r_y2": 243.3, "r_x3": 134.8, "r_y3": 243.3, "coord_origin": "TOPLEFT" }, "text": "OTSL representation. Additional performance benefits can be obtained with", "orig": "OTSL representation. Additional performance benefits can be obtained with", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 14, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 134.8, "r_y0": 264.1, "r_x1": 480.6, "r_y1": 264.1, "r_x2": 480.6, "r_y2": 255.3, "r_x3": 134.8, "r_y3": 255.3, "coord_origin": "TOPLEFT" }, "text": "HPO (hyper parameter optimization). As we demonstrate in our experiments,", "orig": "HPO (hyper parameter optimization). As we demonstrate in our experiments,", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 15, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 134.8, "r_y0": 276.0, "r_x1": 480.6, "r_y1": 276.0, "r_x2": 480.6, "r_y2": 267.2, "r_x3": 134.8, "r_y3": 267.2, "coord_origin": "TOPLEFT" }, "text": "models trained on OTSL can be significantly smaller, e.g. by reducing the number", "orig": "models trained on OTSL can be significantly smaller, e.g. by reducing the number", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 16, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 134.8, "r_y0": 288.0, "r_x1": 480.6, "r_y1": 288.0, "r_x2": 480.6, "r_y2": 279.2, "r_x3": 134.8, "r_y3": 279.2, "coord_origin": "TOPLEFT" }, "text": "of encoder and decoder layers, while preserving comparatively good prediction", "orig": "of encoder and decoder layers, while preserving comparatively good prediction", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 17, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 134.8, "r_y0": 299.9, "r_x1": 480.6, "r_y1": 299.9, "r_x2": 480.6, "r_y2": 291.1, "r_x3": 134.8, "r_y3": 291.1, "coord_origin": "TOPLEFT" }, "text": "quality. This can further improve inference performance, yielding 5-6 times faster", "orig": "quality. This can further improve inference performance, yielding 5-6 times faster", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 18, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 134.8, "r_y0": 311.9, "r_x1": 480.6, "r_y1": 311.9, "r_x2": 480.6, "r_y2": 303.1, "r_x3": 134.8, "r_y3": 303.1, "coord_origin": "TOPLEFT" }, "text": "inference speed in OTSL with prediction quality comparable to models trained", "orig": "inference speed in OTSL with prediction quality comparable to models trained", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 19, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 134.8, "r_y0": 323.8, "r_x1": 240.9, "r_y1": 323.8, "r_x2": 240.9, "r_y2": 315.0, "r_x3": 134.8, "r_y3": 315.0, "coord_origin": "TOPLEFT" }, "text": "on HTML (see Table 1).", "orig": "on HTML (see Table 1).", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, "text": "First and foremost, given the same network configuration, inference time for a table-structure prediction is about 2 times faster compared to the conventional HTML approach. This is primarily owed to the shorter sequence length of the OTSL representation. Additional performance benefits can be obtained with HPO (hyper parameter optimization). As we demonstrate in our experiments, models trained on OTSL can be significantly smaller, e.g. by reducing the number of encoder and decoder layers, while preserving comparatively good prediction quality. This can further improve inference performance, yielding 5-6 times faster inference speed in OTSL with prediction quality comparable to models trained on HTML (see Table 1)." }, { "label": "text", "id": 1, "page_no": 11, "cluster": { "id": 1, "label": "text", "bbox": { "l": 134.8, "t": 327.8, "r": 480.6, "b": 468.1, "coord_origin": "TOPLEFT" }, "confidence": 0.99, "cells": [ { "index": 20, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 149.7, "r_y0": 336.6, "r_x1": 480.6, "r_y1": 336.6, "r_x2": 480.6, "r_y2": 327.8, "r_x3": 149.7, "r_y3": 327.8, "coord_origin": "TOPLEFT" }, "text": "Secondly, OTSL has more inherent structure and a significantly restricted vo-", "orig": "Secondly, OTSL has more inherent structure and a significantly restricted vo-", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 21, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 134.8, "r_y0": 348.6, "r_x1": 480.6, "r_y1": 348.6, "r_x2": 480.6, "r_y2": 339.8, "r_x3": 134.8, "r_y3": 339.8, "coord_origin": "TOPLEFT" }, "text": "cabulary size. This allows autoregressive models to perform better in the TED", "orig": "cabulary size. This allows autoregressive models to perform better in the TED", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 22, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 134.8, "r_y0": 360.5, "r_x1": 480.6, "r_y1": 360.5, "r_x2": 480.6, "r_y2": 351.7, "r_x3": 134.8, "r_y3": 351.7, "coord_origin": "TOPLEFT" }, "text": "metric, but especially with regards to prediction accuracy of the table-cell bound-", "orig": "metric, but especially with regards to prediction accuracy of the table-cell bound-", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 23, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 134.8, "r_y0": 372.5, "r_x1": 480.6, "r_y1": 372.5, "r_x2": 480.6, "r_y2": 363.7, "r_x3": 134.8, "r_y3": 363.7, "coord_origin": "TOPLEFT" }, "text": "ing boxes (see Table 2). As shown in Figure 5, we observe that the OTSL dras-", "orig": "ing boxes (see Table 2). As shown in Figure 5, we observe that the OTSL dras-", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 24, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 134.8, "r_y0": 384.4, "r_x1": 480.6, "r_y1": 384.4, "r_x2": 480.6, "r_y2": 375.6, "r_x3": 134.8, "r_y3": 375.6, "coord_origin": "TOPLEFT" }, "text": "tically reduces the drift for table cell bounding boxes at high row count and in", "orig": "tically reduces the drift for table cell bounding boxes at high row count and in", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 25, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 134.8, "r_y0": 396.4, "r_x1": 480.6, "r_y1": 396.4, "r_x2": 480.6, "r_y2": 387.6, "r_x3": 134.8, "r_y3": 387.6, "coord_origin": "TOPLEFT" }, "text": "sparse tables. This leads to more accurate predictions and a significant reduction", "orig": "sparse tables. This leads to more accurate predictions and a significant reduction", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 26, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 134.8, "r_y0": 408.3, "r_x1": 480.6, "r_y1": 408.3, "r_x2": 480.6, "r_y2": 399.5, "r_x3": 134.8, "r_y3": 399.5, "coord_origin": "TOPLEFT" }, "text": "in post-processing complexity, which is an undesired necessity in HTML-based", "orig": "in post-processing complexity, which is an undesired necessity in HTML-based", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 27, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 134.8, "r_y0": 420.3, "r_x1": 480.6, "r_y1": 420.3, "r_x2": 480.6, "r_y2": 411.5, "r_x3": 134.8, "r_y3": 411.5, "coord_origin": "TOPLEFT" }, "text": "Im2Seq models. Significant novelty lies in OTSL syntactical rules, which are few,", "orig": "Im2Seq models. Significant novelty lies in OTSL syntactical rules, which are few,", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 28, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 134.8, "r_y0": 432.2, "r_x1": 480.6, "r_y1": 432.2, "r_x2": 480.6, "r_y2": 423.4, "r_x3": 134.8, "r_y3": 423.4, "coord_origin": "TOPLEFT" }, "text": "simple and always backwards looking. Each new token can be validated only by", "orig": "simple and always backwards looking. Each new token can be validated only by", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 29, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 134.8, "r_y0": 444.2, "r_x1": 480.6, "r_y1": 444.2, "r_x2": 480.6, "r_y2": 435.4, "r_x3": 134.8, "r_y3": 435.4, "coord_origin": "TOPLEFT" }, "text": "analyzing the sequence of previous tokens, without requiring the entire sequence", "orig": "analyzing the sequence of previous tokens, without requiring the entire sequence", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 30, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 134.8, "r_y0": 456.1, "r_x1": 480.6, "r_y1": 456.1, "r_x2": 480.6, "r_y2": 447.4, "r_x3": 134.8, "r_y3": 447.4, "coord_origin": "TOPLEFT" }, "text": "to detect mistakes. This in return allows to perform structural error detection", "orig": "to detect mistakes. This in return allows to perform structural error detection", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 31, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 134.8, "r_y0": 468.1, "r_x1": 366.8, "r_y1": 468.1, "r_x2": 366.8, "r_y2": 459.3, "r_x3": 134.8, "r_y3": 459.3, "coord_origin": "TOPLEFT" }, "text": "and correction on-the-fly during sequence generation.", "orig": "and correction on-the-fly during sequence generation.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, "text": "Secondly, OTSL has more inherent structure and a significantly restricted vocabulary size. This allows autoregressive models to perform better in the TED metric, but especially with regards to prediction accuracy of the table-cell bounding boxes (see Table 2). As shown in Figure 5, we observe that the OTSL drastically reduces the drift for table cell bounding boxes at high row count and in sparse tables. This leads to more accurate predictions and a significant reduction in post-processing complexity, which is an undesired necessity in HTML-based Im2Seq models. Significant novelty lies in OTSL syntactical rules, which are few, simple and always backwards looking. Each new token can be validated only by analyzing the sequence of previous tokens, without requiring the entire sequence to detect mistakes. This in return allows to perform structural error detection and correction on-the-fly during sequence generation." }, { "label": "section_header", "id": 7, "page_no": 11, "cluster": { "id": 7, "label": "section_header", "bbox": { "l": 134.8, "t": 493.8, "r": 197.7, "b": 504.4, "coord_origin": "TOPLEFT" }, "confidence": 0.94, "cells": [ { "index": 32, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 134.8, "r_y0": 504.4, "r_x1": 197.7, "r_y1": 504.4, "r_x2": 197.7, "r_y2": 493.8, "r_x3": 134.8, "r_y3": 493.8, "coord_origin": "TOPLEFT" }, "text": "References", "orig": "References", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, "text": "References" }, { "label": "list_item", "id": 5, "page_no": 11, "cluster": { "id": 5, "label": "list_item", "bbox": { "l": 139.4, "t": 522.9, "r": 480.6, "b": 563.9, "coord_origin": "TOPLEFT" }, "confidence": 0.97, "cells": [ { "index": 33, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 139.4, "r_y0": 530.9, "r_x1": 146.5, "r_y1": 530.9, "r_x2": 146.5, "r_y2": 522.9, "r_x3": 139.4, "r_y3": 522.9, "coord_origin": "TOPLEFT" }, "text": "1.", "orig": "1.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 34, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 151.0, "r_y0": 530.9, "r_x1": 480.6, "r_y1": 530.9, "r_x2": 480.6, "r_y2": 522.9, "r_x3": 151.0, "r_y3": 522.9, "coord_origin": "TOPLEFT" }, "text": "Auer, C., Dolfi, M., Carvalho, A., Ramis, C.B., Staar, P.W.J.: Delivering doc-", "orig": "Auer, C., Dolfi, M., Carvalho, A., Ramis, C.B., Staar, P.W.J.: Delivering doc-", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 35, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 151.5, "r_y0": 541.9, "r_x1": 480.6, "r_y1": 541.9, "r_x2": 480.6, "r_y2": 533.8, "r_x3": 151.5, "r_y3": 533.8, "coord_origin": "TOPLEFT" }, "text": "ument conversion as a cloud service with high throughput and responsiveness.", "orig": "ument conversion as a cloud service with high throughput and responsiveness.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 36, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 151.5, "r_y0": 552.9, "r_x1": 176.3, "r_y1": 552.9, "r_x2": 176.3, "r_y2": 544.8, "r_x3": 151.5, "r_y3": 544.8, "coord_origin": "TOPLEFT" }, "text": "CoRR", "orig": "CoRR", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 37, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 179.5, "r_y0": 552.7, "r_x1": 250.7, "r_y1": 552.7, "r_x2": 250.7, "r_y2": 544.7, "r_x3": 179.5, "r_y3": 544.7, "coord_origin": "TOPLEFT" }, "text": "abs/2206.00785", "orig": "abs/2206.00785", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 38, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 253.8, "r_y0": 552.9, "r_x1": 282.0, "r_y1": 552.9, "r_x2": 282.0, "r_y2": 544.8, "r_x3": 253.8, "r_y3": 544.8, "coord_origin": "TOPLEFT" }, "text": "(2022).", "orig": "(2022).", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 39, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 285.1, "r_y0": 552.9, "r_x1": 478.0, "r_y1": 552.9, "r_x2": 478.0, "r_y2": 545.4, "r_x3": 285.1, "r_y3": 545.4, "coord_origin": "TOPLEFT" }, "text": "https://doi.org/10.48550/arXiv.2206.00785", "orig": "https://doi.org/10.48550/arXiv.2206.00785", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 40, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 478.0, "r_y0": 552.9, "r_x1": 480.6, "r_y1": 552.9, "r_x2": 480.6, "r_y2": 544.8, "r_x3": 478.0, "r_y3": 544.8, "coord_origin": "TOPLEFT" }, "text": ",", "orig": ",", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 41, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 151.5, "r_y0": 563.9, "r_x1": 344.5, "r_y1": 563.9, "r_x2": 344.5, "r_y2": 556.4, "r_x3": 151.5, "r_y3": 556.4, "coord_origin": "TOPLEFT" }, "text": "https://doi.org/10.48550/arXiv.2206.00785", "orig": "https://doi.org/10.48550/arXiv.2206.00785", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, "text": "1. Auer, C., Dolfi, M., Carvalho, A., Ramis, C.B., Staar, P.W.J.: Delivering document conversion as a cloud service with high throughput and responsiveness. CoRR abs/2206.00785 (2022). https://doi.org/10.48550/arXiv.2206.00785 , https://doi.org/10.48550/arXiv.2206.00785" }, { "label": "list_item", "id": 4, "page_no": 11, "cluster": { "id": 4, "label": "list_item", "bbox": { "l": 139.4, "t": 567.5, "r": 480.6, "b": 608.5, "coord_origin": "TOPLEFT" }, "confidence": 0.97, "cells": [ { "index": 42, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 139.4, "r_y0": 575.6, "r_x1": 145.9, "r_y1": 575.6, "r_x2": 145.9, "r_y2": 567.5, "r_x3": 139.4, "r_y3": 567.5, "coord_origin": "TOPLEFT" }, "text": "2.", "orig": "2.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 43, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 150.2, "r_y0": 575.6, "r_x1": 480.6, "r_y1": 575.6, "r_x2": 480.6, "r_y2": 567.5, "r_x3": 150.2, "r_y3": 567.5, "coord_origin": "TOPLEFT" }, "text": "Chen, B., Peng, D., Zhang, J., Ren, Y., Jin, L.: Complex table structure recognition", "orig": "Chen, B., Peng, D., Zhang, J., Ren, Y., Jin, L.: Complex table structure recognition", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 44, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 151.5, "r_y0": 586.5, "r_x1": 480.6, "r_y1": 586.5, "r_x2": 480.6, "r_y2": 578.5, "r_x3": 151.5, "r_y3": 578.5, "coord_origin": "TOPLEFT" }, "text": "in the wild using transformer and identity matrix-based augmentation. In: Porwal,", "orig": "in the wild using transformer and identity matrix-based augmentation. In: Porwal,", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 45, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 151.5, "r_y0": 597.5, "r_x1": 480.6, "r_y1": 597.5, "r_x2": 480.6, "r_y2": 589.4, "r_x3": 151.5, "r_y3": 589.4, "coord_origin": "TOPLEFT" }, "text": "U., Forn\u00e9s, A., Shafait, F. (eds.) Frontiers in Handwriting Recognition. pp. 545-", "orig": "U., Forn\u00e9s, A., Shafait, F. (eds.) Frontiers in Handwriting Recognition. pp. 545-", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 46, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 151.5, "r_y0": 608.5, "r_x1": 364.2, "r_y1": 608.5, "r_x2": 364.2, "r_y2": 600.4, "r_x3": 151.5, "r_y3": 600.4, "coord_origin": "TOPLEFT" }, "text": "561. Springer International Publishing, Cham (2022)", "orig": "561. Springer International Publishing, Cham (2022)", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, "text": "2. Chen, B., Peng, D., Zhang, J., Ren, Y., Jin, L.: Complex table structure recognition in the wild using transformer and identity matrix-based augmentation. In: Porwal, U., Forn\u00e9s, A., Shafait, F. (eds.) Frontiers in Handwriting Recognition. pp. 545561. Springer International Publishing, Cham (2022)" }, { "label": "list_item", "id": 6, "page_no": 11, "cluster": { "id": 6, "label": "list_item", "bbox": { "l": 139.4, "t": 612.2, "r": 480.6, "b": 631.2, "coord_origin": "TOPLEFT" }, "confidence": 0.96, "cells": [ { "index": 47, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 139.4, "r_y0": 620.2, "r_x1": 146.4, "r_y1": 620.2, "r_x2": 146.4, "r_y2": 612.2, "r_x3": 139.4, "r_y3": 612.2, "coord_origin": "TOPLEFT" }, "text": "3.", "orig": "3.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 48, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 151.0, "r_y0": 620.2, "r_x1": 480.6, "r_y1": 620.2, "r_x2": 480.6, "r_y2": 612.2, "r_x3": 151.0, "r_y3": 612.2, "coord_origin": "TOPLEFT" }, "text": "Chi, Z., Huang, H., Xu, H.D., Yu, H., Yin, W., Mao, X.L.: Complicated table", "orig": "Chi, Z., Huang, H., Xu, H.D., Yu, H., Yin, W., Mao, X.L.: Complicated table", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 49, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 151.5, "r_y0": 631.2, "r_x1": 400.2, "r_y1": 631.2, "r_x2": 400.2, "r_y2": 623.1, "r_x3": 151.5, "r_y3": 623.1, "coord_origin": "TOPLEFT" }, "text": "structure recognition. arXiv preprint arXiv:1908.04729 (2019)", "orig": "structure recognition. arXiv preprint arXiv:1908.04729 (2019)", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, "text": "3. Chi, Z., Huang, H., Xu, H.D., Yu, H., Yin, W., Mao, X.L.: Complicated table structure recognition. arXiv preprint arXiv:1908.04729 (2019)" }, { "label": "list_item", "id": 3, "page_no": 11, "cluster": { "id": 3, "label": "list_item", "bbox": { "l": 139.4, "t": 634.9, "r": 480.6, "b": 664.9, "coord_origin": "TOPLEFT" }, "confidence": 0.98, "cells": [ { "index": 50, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 139.4, "r_y0": 643.0, "r_x1": 146.5, "r_y1": 643.0, "r_x2": 146.5, "r_y2": 634.9, "r_x3": 139.4, "r_y3": 634.9, "coord_origin": "TOPLEFT" }, "text": "4.", "orig": "4.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 51, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 151.1, "r_y0": 643.0, "r_x1": 480.6, "r_y1": 643.0, "r_x2": 480.6, "r_y2": 634.9, "r_x3": 151.1, "r_y3": 634.9, "coord_origin": "TOPLEFT" }, "text": "Deng, Y., Rosenberg, D., Mann, G.: Challenges in end-to-end neural scientific", "orig": "Deng, Y., Rosenberg, D., Mann, G.: Challenges in end-to-end neural scientific", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 52, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 151.5, "r_y0": 653.9, "r_x1": 480.6, "r_y1": 653.9, "r_x2": 480.6, "r_y2": 645.8, "r_x3": 151.5, "r_y3": 645.8, "coord_origin": "TOPLEFT" }, "text": "table recognition. In: 2019 International Conference on Document Analysis and", "orig": "table recognition. In: 2019 International Conference on Document Analysis and", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 53, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 151.5, "r_y0": 664.9, "r_x1": 350.1, "r_y1": 664.9, "r_x2": 350.1, "r_y2": 656.8, "r_x3": 151.5, "r_y3": 656.8, "coord_origin": "TOPLEFT" }, "text": "Recognition (ICDAR). pp. 894-901. IEEE (2019)", "orig": "Recognition (ICDAR). pp. 894-901. IEEE (2019)", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, "text": "4. Deng, Y., Rosenberg, D., Mann, G.: Challenges in end-to-end neural scientific table recognition. In: 2019 International Conference on Document Analysis and Recognition (ICDAR). pp. 894-901. IEEE (2019)" } ], "body": [ { "label": "section_header", "id": 8, "page_no": 11, "cluster": { "id": 8, "label": "section_header", "bbox": { "l": 134.8, "t": 117.5, "r": 219.3, "b": 128.1, "coord_origin": "TOPLEFT" }, "confidence": 0.92, "cells": [ { "index": 3, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 134.8, "r_y0": 128.1, "r_x1": 141.5, "r_y1": 128.1, "r_x2": 141.5, "r_y2": 117.5, "r_x3": 134.8, "r_y3": 117.5, "coord_origin": "TOPLEFT" }, "text": "6", "orig": "6", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 4, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 154.9, "r_y0": 128.1, "r_x1": 219.3, "r_y1": 128.1, "r_x2": 219.3, "r_y2": 117.5, "r_x3": 154.9, "r_y3": 117.5, "coord_origin": "TOPLEFT" }, "text": "Conclusion", "orig": "Conclusion", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, "text": "6 Conclusion" }, { "label": "text", "id": 2, "page_no": 11, "cluster": { "id": 2, "label": "text", "bbox": { "l": 134.8, "t": 146.9, "r": 480.6, "b": 203.5, "coord_origin": "TOPLEFT" }, "confidence": 0.98, "cells": [ { "index": 5, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 134.8, "r_y0": 155.7, "r_x1": 480.6, "r_y1": 155.7, "r_x2": 480.6, "r_y2": 146.9, "r_x3": 134.8, "r_y3": 146.9, "coord_origin": "TOPLEFT" }, "text": "We demonstrated that representing tables in HTML for the task of table struc-", "orig": "We demonstrated that representing tables in HTML for the task of table struc-", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 6, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 134.8, "r_y0": 167.6, "r_x1": 480.6, "r_y1": 167.6, "r_x2": 480.6, "r_y2": 158.8, "r_x3": 134.8, "r_y3": 158.8, "coord_origin": "TOPLEFT" }, "text": "ture recognition with Im2Seq models is ill-suited and has serious limitations.", "orig": "ture recognition with Im2Seq models is ill-suited and has serious limitations.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 7, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 134.8, "r_y0": 179.6, "r_x1": 480.6, "r_y1": 179.6, "r_x2": 480.6, "r_y2": 170.8, "r_x3": 134.8, "r_y3": 170.8, "coord_origin": "TOPLEFT" }, "text": "Furthermore, we presented in this paper an Optimized Table Structure Language", "orig": "Furthermore, we presented in this paper an Optimized Table Structure Language", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 8, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 134.8, "r_y0": 191.5, "r_x1": 480.6, "r_y1": 191.5, "r_x2": 480.6, "r_y2": 182.7, "r_x3": 134.8, "r_y3": 182.7, "coord_origin": "TOPLEFT" }, "text": "(OTSL) which, when compared to commonly used general purpose languages,", "orig": "(OTSL) which, when compared to commonly used general purpose languages,", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 9, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 134.8, "r_y0": 203.5, "r_x1": 239.5, "r_y1": 203.5, "r_x2": 239.5, "r_y2": 194.7, "r_x3": 134.8, "r_y3": 194.7, "coord_origin": "TOPLEFT" }, "text": "has several key benefits.", "orig": "has several key benefits.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, "text": "We demonstrated that representing tables in HTML for the task of table structure recognition with Im2Seq models is ill-suited and has serious limitations. Furthermore, we presented in this paper an Optimized Table Structure Language (OTSL) which, when compared to commonly used general purpose languages, has several key benefits." }, { "label": "text", "id": 0, "page_no": 11, "cluster": { "id": 0, "label": "text", "bbox": { "l": 134.8, "t": 207.4, "r": 480.6, "b": 323.8, "coord_origin": "TOPLEFT" }, "confidence": 0.99, "cells": [ { "index": 10, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 149.7, "r_y0": 216.2, "r_x1": 480.6, "r_y1": 216.2, "r_x2": 480.6, "r_y2": 207.4, "r_x3": 149.7, "r_y3": 207.4, "coord_origin": "TOPLEFT" }, "text": "First and foremost, given the same network configuration, inference time for", "orig": "First and foremost, given the same network configuration, inference time for", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 11, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 134.8, "r_y0": 228.2, "r_x1": 480.6, "r_y1": 228.2, "r_x2": 480.6, "r_y2": 219.4, "r_x3": 134.8, "r_y3": 219.4, "coord_origin": "TOPLEFT" }, "text": "a table-structure prediction is about 2 times faster compared to the conventional", "orig": "a table-structure prediction is about 2 times faster compared to the conventional", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 12, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 134.8, "r_y0": 240.2, "r_x1": 480.6, "r_y1": 240.2, "r_x2": 480.6, "r_y2": 231.4, "r_x3": 134.8, "r_y3": 231.4, "coord_origin": "TOPLEFT" }, "text": "HTML approach. This is primarily owed to the shorter sequence length of the", "orig": "HTML approach. This is primarily owed to the shorter sequence length of the", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 13, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 134.8, "r_y0": 252.1, "r_x1": 480.6, "r_y1": 252.1, "r_x2": 480.6, "r_y2": 243.3, "r_x3": 134.8, "r_y3": 243.3, "coord_origin": "TOPLEFT" }, "text": "OTSL representation. Additional performance benefits can be obtained with", "orig": "OTSL representation. Additional performance benefits can be obtained with", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 14, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 134.8, "r_y0": 264.1, "r_x1": 480.6, "r_y1": 264.1, "r_x2": 480.6, "r_y2": 255.3, "r_x3": 134.8, "r_y3": 255.3, "coord_origin": "TOPLEFT" }, "text": "HPO (hyper parameter optimization). As we demonstrate in our experiments,", "orig": "HPO (hyper parameter optimization). As we demonstrate in our experiments,", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 15, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 134.8, "r_y0": 276.0, "r_x1": 480.6, "r_y1": 276.0, "r_x2": 480.6, "r_y2": 267.2, "r_x3": 134.8, "r_y3": 267.2, "coord_origin": "TOPLEFT" }, "text": "models trained on OTSL can be significantly smaller, e.g. by reducing the number", "orig": "models trained on OTSL can be significantly smaller, e.g. by reducing the number", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 16, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 134.8, "r_y0": 288.0, "r_x1": 480.6, "r_y1": 288.0, "r_x2": 480.6, "r_y2": 279.2, "r_x3": 134.8, "r_y3": 279.2, "coord_origin": "TOPLEFT" }, "text": "of encoder and decoder layers, while preserving comparatively good prediction", "orig": "of encoder and decoder layers, while preserving comparatively good prediction", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 17, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 134.8, "r_y0": 299.9, "r_x1": 480.6, "r_y1": 299.9, "r_x2": 480.6, "r_y2": 291.1, "r_x3": 134.8, "r_y3": 291.1, "coord_origin": "TOPLEFT" }, "text": "quality. This can further improve inference performance, yielding 5-6 times faster", "orig": "quality. This can further improve inference performance, yielding 5-6 times faster", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 18, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 134.8, "r_y0": 311.9, "r_x1": 480.6, "r_y1": 311.9, "r_x2": 480.6, "r_y2": 303.1, "r_x3": 134.8, "r_y3": 303.1, "coord_origin": "TOPLEFT" }, "text": "inference speed in OTSL with prediction quality comparable to models trained", "orig": "inference speed in OTSL with prediction quality comparable to models trained", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 19, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 134.8, "r_y0": 323.8, "r_x1": 240.9, "r_y1": 323.8, "r_x2": 240.9, "r_y2": 315.0, "r_x3": 134.8, "r_y3": 315.0, "coord_origin": "TOPLEFT" }, "text": "on HTML (see Table 1).", "orig": "on HTML (see Table 1).", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, "text": "First and foremost, given the same network configuration, inference time for a table-structure prediction is about 2 times faster compared to the conventional HTML approach. This is primarily owed to the shorter sequence length of the OTSL representation. Additional performance benefits can be obtained with HPO (hyper parameter optimization). As we demonstrate in our experiments, models trained on OTSL can be significantly smaller, e.g. by reducing the number of encoder and decoder layers, while preserving comparatively good prediction quality. This can further improve inference performance, yielding 5-6 times faster inference speed in OTSL with prediction quality comparable to models trained on HTML (see Table 1)." }, { "label": "text", "id": 1, "page_no": 11, "cluster": { "id": 1, "label": "text", "bbox": { "l": 134.8, "t": 327.8, "r": 480.6, "b": 468.1, "coord_origin": "TOPLEFT" }, "confidence": 0.99, "cells": [ { "index": 20, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 149.7, "r_y0": 336.6, "r_x1": 480.6, "r_y1": 336.6, "r_x2": 480.6, "r_y2": 327.8, "r_x3": 149.7, "r_y3": 327.8, "coord_origin": "TOPLEFT" }, "text": "Secondly, OTSL has more inherent structure and a significantly restricted vo-", "orig": "Secondly, OTSL has more inherent structure and a significantly restricted vo-", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 21, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 134.8, "r_y0": 348.6, "r_x1": 480.6, "r_y1": 348.6, "r_x2": 480.6, "r_y2": 339.8, "r_x3": 134.8, "r_y3": 339.8, "coord_origin": "TOPLEFT" }, "text": "cabulary size. This allows autoregressive models to perform better in the TED", "orig": "cabulary size. This allows autoregressive models to perform better in the TED", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 22, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 134.8, "r_y0": 360.5, "r_x1": 480.6, "r_y1": 360.5, "r_x2": 480.6, "r_y2": 351.7, "r_x3": 134.8, "r_y3": 351.7, "coord_origin": "TOPLEFT" }, "text": "metric, but especially with regards to prediction accuracy of the table-cell bound-", "orig": "metric, but especially with regards to prediction accuracy of the table-cell bound-", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 23, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 134.8, "r_y0": 372.5, "r_x1": 480.6, "r_y1": 372.5, "r_x2": 480.6, "r_y2": 363.7, "r_x3": 134.8, "r_y3": 363.7, "coord_origin": "TOPLEFT" }, "text": "ing boxes (see Table 2). As shown in Figure 5, we observe that the OTSL dras-", "orig": "ing boxes (see Table 2). As shown in Figure 5, we observe that the OTSL dras-", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 24, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 134.8, "r_y0": 384.4, "r_x1": 480.6, "r_y1": 384.4, "r_x2": 480.6, "r_y2": 375.6, "r_x3": 134.8, "r_y3": 375.6, "coord_origin": "TOPLEFT" }, "text": "tically reduces the drift for table cell bounding boxes at high row count and in", "orig": "tically reduces the drift for table cell bounding boxes at high row count and in", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 25, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 134.8, "r_y0": 396.4, "r_x1": 480.6, "r_y1": 396.4, "r_x2": 480.6, "r_y2": 387.6, "r_x3": 134.8, "r_y3": 387.6, "coord_origin": "TOPLEFT" }, "text": "sparse tables. This leads to more accurate predictions and a significant reduction", "orig": "sparse tables. This leads to more accurate predictions and a significant reduction", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 26, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 134.8, "r_y0": 408.3, "r_x1": 480.6, "r_y1": 408.3, "r_x2": 480.6, "r_y2": 399.5, "r_x3": 134.8, "r_y3": 399.5, "coord_origin": "TOPLEFT" }, "text": "in post-processing complexity, which is an undesired necessity in HTML-based", "orig": "in post-processing complexity, which is an undesired necessity in HTML-based", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 27, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 134.8, "r_y0": 420.3, "r_x1": 480.6, "r_y1": 420.3, "r_x2": 480.6, "r_y2": 411.5, "r_x3": 134.8, "r_y3": 411.5, "coord_origin": "TOPLEFT" }, "text": "Im2Seq models. Significant novelty lies in OTSL syntactical rules, which are few,", "orig": "Im2Seq models. Significant novelty lies in OTSL syntactical rules, which are few,", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 28, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 134.8, "r_y0": 432.2, "r_x1": 480.6, "r_y1": 432.2, "r_x2": 480.6, "r_y2": 423.4, "r_x3": 134.8, "r_y3": 423.4, "coord_origin": "TOPLEFT" }, "text": "simple and always backwards looking. Each new token can be validated only by", "orig": "simple and always backwards looking. Each new token can be validated only by", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 29, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 134.8, "r_y0": 444.2, "r_x1": 480.6, "r_y1": 444.2, "r_x2": 480.6, "r_y2": 435.4, "r_x3": 134.8, "r_y3": 435.4, "coord_origin": "TOPLEFT" }, "text": "analyzing the sequence of previous tokens, without requiring the entire sequence", "orig": "analyzing the sequence of previous tokens, without requiring the entire sequence", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 30, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 134.8, "r_y0": 456.1, "r_x1": 480.6, "r_y1": 456.1, "r_x2": 480.6, "r_y2": 447.4, "r_x3": 134.8, "r_y3": 447.4, "coord_origin": "TOPLEFT" }, "text": "to detect mistakes. This in return allows to perform structural error detection", "orig": "to detect mistakes. This in return allows to perform structural error detection", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 31, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 134.8, "r_y0": 468.1, "r_x1": 366.8, "r_y1": 468.1, "r_x2": 366.8, "r_y2": 459.3, "r_x3": 134.8, "r_y3": 459.3, "coord_origin": "TOPLEFT" }, "text": "and correction on-the-fly during sequence generation.", "orig": "and correction on-the-fly during sequence generation.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, "text": "Secondly, OTSL has more inherent structure and a significantly restricted vocabulary size. This allows autoregressive models to perform better in the TED metric, but especially with regards to prediction accuracy of the table-cell bounding boxes (see Table 2). As shown in Figure 5, we observe that the OTSL drastically reduces the drift for table cell bounding boxes at high row count and in sparse tables. This leads to more accurate predictions and a significant reduction in post-processing complexity, which is an undesired necessity in HTML-based Im2Seq models. Significant novelty lies in OTSL syntactical rules, which are few, simple and always backwards looking. Each new token can be validated only by analyzing the sequence of previous tokens, without requiring the entire sequence to detect mistakes. This in return allows to perform structural error detection and correction on-the-fly during sequence generation." }, { "label": "section_header", "id": 7, "page_no": 11, "cluster": { "id": 7, "label": "section_header", "bbox": { "l": 134.8, "t": 493.8, "r": 197.7, "b": 504.4, "coord_origin": "TOPLEFT" }, "confidence": 0.94, "cells": [ { "index": 32, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 134.8, "r_y0": 504.4, "r_x1": 197.7, "r_y1": 504.4, "r_x2": 197.7, "r_y2": 493.8, "r_x3": 134.8, "r_y3": 493.8, "coord_origin": "TOPLEFT" }, "text": "References", "orig": "References", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, "text": "References" }, { "label": "list_item", "id": 5, "page_no": 11, "cluster": { "id": 5, "label": "list_item", "bbox": { "l": 139.4, "t": 522.9, "r": 480.6, "b": 563.9, "coord_origin": "TOPLEFT" }, "confidence": 0.97, "cells": [ { "index": 33, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 139.4, "r_y0": 530.9, "r_x1": 146.5, "r_y1": 530.9, "r_x2": 146.5, "r_y2": 522.9, "r_x3": 139.4, "r_y3": 522.9, "coord_origin": "TOPLEFT" }, "text": "1.", "orig": "1.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 34, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 151.0, "r_y0": 530.9, "r_x1": 480.6, "r_y1": 530.9, "r_x2": 480.6, "r_y2": 522.9, "r_x3": 151.0, "r_y3": 522.9, "coord_origin": "TOPLEFT" }, "text": "Auer, C., Dolfi, M., Carvalho, A., Ramis, C.B., Staar, P.W.J.: Delivering doc-", "orig": "Auer, C., Dolfi, M., Carvalho, A., Ramis, C.B., Staar, P.W.J.: Delivering doc-", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 35, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 151.5, "r_y0": 541.9, "r_x1": 480.6, "r_y1": 541.9, "r_x2": 480.6, "r_y2": 533.8, "r_x3": 151.5, "r_y3": 533.8, "coord_origin": "TOPLEFT" }, "text": "ument conversion as a cloud service with high throughput and responsiveness.", "orig": "ument conversion as a cloud service with high throughput and responsiveness.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 36, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 151.5, "r_y0": 552.9, "r_x1": 176.3, "r_y1": 552.9, "r_x2": 176.3, "r_y2": 544.8, "r_x3": 151.5, "r_y3": 544.8, "coord_origin": "TOPLEFT" }, "text": "CoRR", "orig": "CoRR", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 37, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 179.5, "r_y0": 552.7, "r_x1": 250.7, "r_y1": 552.7, "r_x2": 250.7, "r_y2": 544.7, "r_x3": 179.5, "r_y3": 544.7, "coord_origin": "TOPLEFT" }, "text": "abs/2206.00785", "orig": "abs/2206.00785", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 38, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 253.8, "r_y0": 552.9, "r_x1": 282.0, "r_y1": 552.9, "r_x2": 282.0, "r_y2": 544.8, "r_x3": 253.8, "r_y3": 544.8, "coord_origin": "TOPLEFT" }, "text": "(2022).", "orig": "(2022).", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 39, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 285.1, "r_y0": 552.9, "r_x1": 478.0, "r_y1": 552.9, "r_x2": 478.0, "r_y2": 545.4, "r_x3": 285.1, "r_y3": 545.4, "coord_origin": "TOPLEFT" }, "text": "https://doi.org/10.48550/arXiv.2206.00785", "orig": "https://doi.org/10.48550/arXiv.2206.00785", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 40, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 478.0, "r_y0": 552.9, "r_x1": 480.6, "r_y1": 552.9, "r_x2": 480.6, "r_y2": 544.8, "r_x3": 478.0, "r_y3": 544.8, "coord_origin": "TOPLEFT" }, "text": ",", "orig": ",", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 41, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 151.5, "r_y0": 563.9, "r_x1": 344.5, "r_y1": 563.9, "r_x2": 344.5, "r_y2": 556.4, "r_x3": 151.5, "r_y3": 556.4, "coord_origin": "TOPLEFT" }, "text": "https://doi.org/10.48550/arXiv.2206.00785", "orig": "https://doi.org/10.48550/arXiv.2206.00785", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, "text": "1. Auer, C., Dolfi, M., Carvalho, A., Ramis, C.B., Staar, P.W.J.: Delivering document conversion as a cloud service with high throughput and responsiveness. CoRR abs/2206.00785 (2022). https://doi.org/10.48550/arXiv.2206.00785 , https://doi.org/10.48550/arXiv.2206.00785" }, { "label": "list_item", "id": 4, "page_no": 11, "cluster": { "id": 4, "label": "list_item", "bbox": { "l": 139.4, "t": 567.5, "r": 480.6, "b": 608.5, "coord_origin": "TOPLEFT" }, "confidence": 0.97, "cells": [ { "index": 42, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 139.4, "r_y0": 575.6, "r_x1": 145.9, "r_y1": 575.6, "r_x2": 145.9, "r_y2": 567.5, "r_x3": 139.4, "r_y3": 567.5, "coord_origin": "TOPLEFT" }, "text": "2.", "orig": "2.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 43, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 150.2, "r_y0": 575.6, "r_x1": 480.6, "r_y1": 575.6, "r_x2": 480.6, "r_y2": 567.5, "r_x3": 150.2, "r_y3": 567.5, "coord_origin": "TOPLEFT" }, "text": "Chen, B., Peng, D., Zhang, J., Ren, Y., Jin, L.: Complex table structure recognition", "orig": "Chen, B., Peng, D., Zhang, J., Ren, Y., Jin, L.: Complex table structure recognition", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 44, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 151.5, "r_y0": 586.5, "r_x1": 480.6, "r_y1": 586.5, "r_x2": 480.6, "r_y2": 578.5, "r_x3": 151.5, "r_y3": 578.5, "coord_origin": "TOPLEFT" }, "text": "in the wild using transformer and identity matrix-based augmentation. In: Porwal,", "orig": "in the wild using transformer and identity matrix-based augmentation. In: Porwal,", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 45, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 151.5, "r_y0": 597.5, "r_x1": 480.6, "r_y1": 597.5, "r_x2": 480.6, "r_y2": 589.4, "r_x3": 151.5, "r_y3": 589.4, "coord_origin": "TOPLEFT" }, "text": "U., Forn\u00e9s, A., Shafait, F. (eds.) Frontiers in Handwriting Recognition. pp. 545-", "orig": "U., Forn\u00e9s, A., Shafait, F. (eds.) Frontiers in Handwriting Recognition. pp. 545-", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 46, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 151.5, "r_y0": 608.5, "r_x1": 364.2, "r_y1": 608.5, "r_x2": 364.2, "r_y2": 600.4, "r_x3": 151.5, "r_y3": 600.4, "coord_origin": "TOPLEFT" }, "text": "561. Springer International Publishing, Cham (2022)", "orig": "561. Springer International Publishing, Cham (2022)", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, "text": "2. Chen, B., Peng, D., Zhang, J., Ren, Y., Jin, L.: Complex table structure recognition in the wild using transformer and identity matrix-based augmentation. In: Porwal, U., Forn\u00e9s, A., Shafait, F. (eds.) Frontiers in Handwriting Recognition. pp. 545561. Springer International Publishing, Cham (2022)" }, { "label": "list_item", "id": 6, "page_no": 11, "cluster": { "id": 6, "label": "list_item", "bbox": { "l": 139.4, "t": 612.2, "r": 480.6, "b": 631.2, "coord_origin": "TOPLEFT" }, "confidence": 0.96, "cells": [ { "index": 47, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 139.4, "r_y0": 620.2, "r_x1": 146.4, "r_y1": 620.2, "r_x2": 146.4, "r_y2": 612.2, "r_x3": 139.4, "r_y3": 612.2, "coord_origin": "TOPLEFT" }, "text": "3.", "orig": "3.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 48, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 151.0, "r_y0": 620.2, "r_x1": 480.6, "r_y1": 620.2, "r_x2": 480.6, "r_y2": 612.2, "r_x3": 151.0, "r_y3": 612.2, "coord_origin": "TOPLEFT" }, "text": "Chi, Z., Huang, H., Xu, H.D., Yu, H., Yin, W., Mao, X.L.: Complicated table", "orig": "Chi, Z., Huang, H., Xu, H.D., Yu, H., Yin, W., Mao, X.L.: Complicated table", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 49, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 151.5, "r_y0": 631.2, "r_x1": 400.2, "r_y1": 631.2, "r_x2": 400.2, "r_y2": 623.1, "r_x3": 151.5, "r_y3": 623.1, "coord_origin": "TOPLEFT" }, "text": "structure recognition. arXiv preprint arXiv:1908.04729 (2019)", "orig": "structure recognition. arXiv preprint arXiv:1908.04729 (2019)", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, "text": "3. Chi, Z., Huang, H., Xu, H.D., Yu, H., Yin, W., Mao, X.L.: Complicated table structure recognition. arXiv preprint arXiv:1908.04729 (2019)" }, { "label": "list_item", "id": 3, "page_no": 11, "cluster": { "id": 3, "label": "list_item", "bbox": { "l": 139.4, "t": 634.9, "r": 480.6, "b": 664.9, "coord_origin": "TOPLEFT" }, "confidence": 0.98, "cells": [ { "index": 50, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 139.4, "r_y0": 643.0, "r_x1": 146.5, "r_y1": 643.0, "r_x2": 146.5, "r_y2": 634.9, "r_x3": 139.4, "r_y3": 634.9, "coord_origin": "TOPLEFT" }, "text": "4.", "orig": "4.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 51, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 151.1, "r_y0": 643.0, "r_x1": 480.6, "r_y1": 643.0, "r_x2": 480.6, "r_y2": 634.9, "r_x3": 151.1, "r_y3": 634.9, "coord_origin": "TOPLEFT" }, "text": "Deng, Y., Rosenberg, D., Mann, G.: Challenges in end-to-end neural scientific", "orig": "Deng, Y., Rosenberg, D., Mann, G.: Challenges in end-to-end neural scientific", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 52, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 151.5, "r_y0": 653.9, "r_x1": 480.6, "r_y1": 653.9, "r_x2": 480.6, "r_y2": 645.8, "r_x3": 151.5, "r_y3": 645.8, "coord_origin": "TOPLEFT" }, "text": "table recognition. In: 2019 International Conference on Document Analysis and", "orig": "table recognition. In: 2019 International Conference on Document Analysis and", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 53, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 151.5, "r_y0": 664.9, "r_x1": 350.1, "r_y1": 664.9, "r_x2": 350.1, "r_y2": 656.8, "r_x3": 151.5, "r_y3": 656.8, "coord_origin": "TOPLEFT" }, "text": "Recognition (ICDAR). pp. 894-901. IEEE (2019)", "orig": "Recognition (ICDAR). pp. 894-901. IEEE (2019)", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, "text": "4. Deng, Y., Rosenberg, D., Mann, G.: Challenges in end-to-end neural scientific table recognition. In: 2019 International Conference on Document Analysis and Recognition (ICDAR). pp. 894-901. IEEE (2019)" } ], "headers": [ { "label": "page_header", "id": 10, "page_no": 11, "cluster": { "id": 10, "label": "page_header", "bbox": { "l": 134.8, "t": 93.8, "r": 144.0, "b": 101.8, "coord_origin": "TOPLEFT" }, "confidence": 0.86, "cells": [ { "index": 0, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 134.8, "r_y0": 101.8, "r_x1": 144.0, "r_y1": 101.8, "r_x2": 144.0, "r_y2": 93.8, "r_x3": 134.8, "r_y3": 93.8, "coord_origin": "TOPLEFT" }, "text": "12", "orig": "12", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, "text": "12" }, { "label": "page_header", "id": 9, "page_no": 11, "cluster": { "id": 9, "label": "page_header", "bbox": { "l": 167.8, "t": 93.8, "r": 231.7, "b": 101.8, "coord_origin": "TOPLEFT" }, "confidence": 0.89, "cells": [ { "index": 1, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 167.8, "r_y0": 101.8, "r_x1": 178.1, "r_y1": 101.8, "r_x2": 178.1, "r_y2": 93.8, "r_x3": 167.8, "r_y3": 93.8, "coord_origin": "TOPLEFT" }, "text": "M.", "orig": "M.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 2, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 182.4, "r_y0": 101.8, "r_x1": 231.7, "r_y1": 101.8, "r_x2": 231.7, "r_y2": 93.8, "r_x3": 182.4, "r_y3": 93.8, "coord_origin": "TOPLEFT" }, "text": "Lysak, et al.", "orig": "Lysak, et al.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, "text": "M. Lysak, et al." } ] } }, { "page_no": 12, "size": { "width": 612.0, "height": 792.0 }, "parsed_page": { "dimension": { "angle": 0.0, "rect": { "r_x0": 0.0, "r_y0": 0.0, "r_x1": 612.0, "r_y1": 0.0, "r_x2": 612.0, "r_y2": 792.0, "r_x3": 0.0, "r_y3": 792.0, "coord_origin": "BOTTOMLEFT" }, "boundary_type": "crop_box", "art_bbox": { "l": 0.0, "t": 792.0, "r": 612.0, "b": 0.0, "coord_origin": "BOTTOMLEFT" }, "bleed_bbox": { "l": 0.0, "t": 792.0, "r": 612.0, "b": 0.0, "coord_origin": "BOTTOMLEFT" }, "crop_bbox": { "l": 0.0, "t": 792.0, "r": 612.0, "b": 0.0, "coord_origin": "BOTTOMLEFT" }, "media_bbox": { "l": 0.0, "t": 792.0, "r": 612.0, "b": 0.0, "coord_origin": "BOTTOMLEFT" }, "trim_bbox": { "l": 0.0, "t": 792.0, "r": 612.0, "b": 0.0, "coord_origin": "BOTTOMLEFT" } }, "bitmap_resources": [], "char_cells": [], "word_cells": [], "textline_cells": [ { "index": 0, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 194.5, "r_y0": 101.8, "r_x1": 447.5, "r_y1": 101.8, "r_x2": 447.5, "r_y2": 93.8, "r_x3": 194.5, "r_y3": 93.8, "coord_origin": "TOPLEFT" }, "text": "Optimized Table Tokenization for Table Structure Recognition", "orig": "Optimized Table Tokenization for Table Structure Recognition", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 1, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 471.4, "r_y0": 101.8, "r_x1": 480.6, "r_y1": 101.8, "r_x2": 480.6, "r_y2": 93.8, "r_x3": 471.4, "r_y3": 93.8, "coord_origin": "TOPLEFT" }, "text": "13", "orig": "13", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 2, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 139.4, "r_y0": 127.7, "r_x1": 146.0, "r_y1": 127.7, "r_x2": 146.0, "r_y2": 119.7, "r_x3": 139.4, "r_y3": 119.7, "coord_origin": "TOPLEFT" }, "text": "5.", "orig": "5.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 3, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 150.3, "r_y0": 127.7, "r_x1": 480.6, "r_y1": 127.7, "r_x2": 480.6, "r_y2": 119.7, "r_x3": 150.3, "r_y3": 119.7, "coord_origin": "TOPLEFT" }, "text": "Kayal, P., Anand, M., Desai, H., Singh, M.: Tables to latex: structure and content", "orig": "Kayal, P., Anand, M., Desai, H., Singh, M.: Tables to latex: structure and content", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 4, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 151.5, "r_y0": 138.7, "r_x1": 480.6, "r_y1": 138.7, "r_x2": 480.6, "r_y2": 130.6, "r_x3": 151.5, "r_y3": 130.6, "coord_origin": "TOPLEFT" }, "text": "extraction from scientific tables. International Journal on Document Analysis and", "orig": "extraction from scientific tables. International Journal on Document Analysis and", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 5, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 151.5, "r_y0": 149.7, "r_x1": 304.0, "r_y1": 149.7, "r_x2": 304.0, "r_y2": 141.6, "r_x3": 151.5, "r_y3": 141.6, "coord_origin": "TOPLEFT" }, "text": "Recognition (IJDAR) pp. 1-10 (2022)", "orig": "Recognition (IJDAR) pp. 1-10 (2022)", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 6, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 139.4, "r_y0": 160.6, "r_x1": 145.9, "r_y1": 160.6, "r_x2": 145.9, "r_y2": 152.6, "r_x3": 139.4, "r_y3": 152.6, "coord_origin": "TOPLEFT" }, "text": "6.", "orig": "6.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 7, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 150.2, "r_y0": 160.6, "r_x1": 480.6, "r_y1": 160.6, "r_x2": 480.6, "r_y2": 152.6, "r_x3": 150.2, "r_y3": 152.6, "coord_origin": "TOPLEFT" }, "text": "Lee, E., Kwon, J., Yang, H., Park, J., Lee, S., Koo, H.I., Cho, N.I.: Table structure", "orig": "Lee, E., Kwon, J., Yang, H., Park, J., Lee, S., Koo, H.I., Cho, N.I.: Table structure", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 8, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 151.5, "r_y0": 171.6, "r_x1": 480.6, "r_y1": 171.6, "r_x2": 480.6, "r_y2": 163.5, "r_x3": 151.5, "r_y3": 163.5, "coord_origin": "TOPLEFT" }, "text": "recognition based on grid shape graph. In: 2022 Asia-Pacific Signal and Information", "orig": "recognition based on grid shape graph. In: 2022 Asia-Pacific Signal and Information", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 9, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 151.5, "r_y0": 182.5, "r_x1": 480.6, "r_y1": 182.5, "r_x2": 480.6, "r_y2": 174.5, "r_x3": 151.5, "r_y3": 174.5, "coord_origin": "TOPLEFT" }, "text": "Processing Association Annual Summit and Conference (APSIPA ASC). pp. 1868-", "orig": "Processing Association Annual Summit and Conference (APSIPA ASC). pp. 1868-", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 10, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 151.5, "r_y0": 193.5, "r_x1": 226.4, "r_y1": 193.5, "r_x2": 226.4, "r_y2": 185.4, "r_x3": 151.5, "r_y3": 185.4, "coord_origin": "TOPLEFT" }, "text": "1873. IEEE (2022)", "orig": "1873. IEEE (2022)", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 11, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 139.4, "r_y0": 204.5, "r_x1": 146.3, "r_y1": 204.5, "r_x2": 146.3, "r_y2": 196.4, "r_x3": 139.4, "r_y3": 196.4, "coord_origin": "TOPLEFT" }, "text": "7.", "orig": "7.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 12, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 150.8, "r_y0": 204.5, "r_x1": 480.6, "r_y1": 204.5, "r_x2": 480.6, "r_y2": 196.4, "r_x3": 150.8, "r_y3": 196.4, "coord_origin": "TOPLEFT" }, "text": "Li, M., Cui, L., Huang, S., Wei, F., Zhou, M., Li, Z.: Tablebank: A benchmark", "orig": "Li, M., Cui, L., Huang, S., Wei, F., Zhou, M., Li, Z.: Tablebank: A benchmark", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 13, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 151.5, "r_y0": 215.4, "r_x1": 352.0, "r_y1": 215.4, "r_x2": 352.0, "r_y2": 207.4, "r_x3": 151.5, "r_y3": 207.4, "coord_origin": "TOPLEFT" }, "text": "dataset for table detection and recognition (2019)", "orig": "dataset for table detection and recognition (2019)", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 14, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 139.4, "r_y0": 226.4, "r_x1": 146.4, "r_y1": 226.4, "r_x2": 146.4, "r_y2": 218.3, "r_x3": 139.4, "r_y3": 218.3, "coord_origin": "TOPLEFT" }, "text": "8.", "orig": "8.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 15, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 150.9, "r_y0": 226.4, "r_x1": 480.6, "r_y1": 226.4, "r_x2": 480.6, "r_y2": 218.3, "r_x3": 150.9, "r_y3": 218.3, "coord_origin": "TOPLEFT" }, "text": "Livathinos, N., Berrospi, C., Lysak, M., Kuropiatnyk, V., Nassar, A., Carvalho,", "orig": "Livathinos, N., Berrospi, C., Lysak, M., Kuropiatnyk, V., Nassar, A., Carvalho,", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 16, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 151.5, "r_y0": 237.4, "r_x1": 480.6, "r_y1": 237.4, "r_x2": 480.6, "r_y2": 229.3, "r_x3": 151.5, "r_y3": 229.3, "coord_origin": "TOPLEFT" }, "text": "A., Dolfi, M., Auer, C., Dinkla, K., Staar, P.: Robust pdf document conversion", "orig": "A., Dolfi, M., Auer, C., Dinkla, K., Staar, P.: Robust pdf document conversion", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 17, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 151.5, "r_y0": 248.3, "r_x1": 480.6, "r_y1": 248.3, "r_x2": 480.6, "r_y2": 240.3, "r_x3": 151.5, "r_y3": 240.3, "coord_origin": "TOPLEFT" }, "text": "using recurrent neural networks. Proceedings of the AAAI Conference on Artificial", "orig": "using recurrent neural networks. Proceedings of the AAAI Conference on Artificial", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 18, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 151.5, "r_y0": 259.3, "r_x1": 197.1, "r_y1": 259.3, "r_x2": 197.1, "r_y2": 251.2, "r_x3": 151.5, "r_y3": 251.2, "coord_origin": "TOPLEFT" }, "text": "Intelligence", "orig": "Intelligence", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 19, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 199.4, "r_y0": 259.1, "r_x1": 210.0, "r_y1": 259.1, "r_x2": 210.0, "r_y2": 251.2, "r_x3": 199.4, "r_y3": 251.2, "coord_origin": "TOPLEFT" }, "text": "35", "orig": "35", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 20, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 210.0, "r_y0": 259.3, "r_x1": 332.4, "r_y1": 259.3, "r_x2": 332.4, "r_y2": 251.2, "r_x3": 210.0, "r_y3": 251.2, "coord_origin": "TOPLEFT" }, "text": "(17), 15137-15145 (May 2021),", "orig": "(17), 15137-15145 (May 2021),", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 21, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 334.7, "r_y0": 259.3, "r_x1": 480.6, "r_y1": 259.3, "r_x2": 480.6, "r_y2": 251.9, "r_x3": 334.7, "r_y3": 251.9, "coord_origin": "TOPLEFT" }, "text": "https://ojs.aaai.org/index.php/", "orig": "https://ojs.aaai.org/index.php/", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 22, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 151.5, "r_y0": 270.3, "r_x1": 259.8, "r_y1": 270.3, "r_x2": 259.8, "r_y2": 262.8, "r_x3": 151.5, "r_y3": 262.8, "coord_origin": "TOPLEFT" }, "text": "AAAI/article/view/17777", "orig": "AAAI/article/view/17777", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 23, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 139.4, "r_y0": 281.2, "r_x1": 146.1, "r_y1": 281.2, "r_x2": 146.1, "r_y2": 273.1, "r_x3": 139.4, "r_y3": 273.1, "coord_origin": "TOPLEFT" }, "text": "9.", "orig": "9.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 24, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 150.5, "r_y0": 281.2, "r_x1": 480.6, "r_y1": 281.2, "r_x2": 480.6, "r_y2": 273.1, "r_x3": 150.5, "r_y3": 273.1, "coord_origin": "TOPLEFT" }, "text": "Nassar, A., Livathinos, N., Lysak, M., Staar, P.: Tableformer: Table structure un-", "orig": "Nassar, A., Livathinos, N., Lysak, M., Staar, P.: Tableformer: Table structure un-", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 25, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 151.5, "r_y0": 292.2, "r_x1": 480.6, "r_y1": 292.2, "r_x2": 480.6, "r_y2": 284.1, "r_x3": 151.5, "r_y3": 284.1, "coord_origin": "TOPLEFT" }, "text": "derstanding with transformers. In: Proceedings of the IEEE/CVF Conference on", "orig": "derstanding with transformers. In: Proceedings of the IEEE/CVF Conference on", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 26, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 151.5, "r_y0": 303.1, "r_x1": 473.4, "r_y1": 303.1, "r_x2": 473.4, "r_y2": 295.1, "r_x3": 151.5, "r_y3": 295.1, "coord_origin": "TOPLEFT" }, "text": "Computer Vision and Pattern Recognition (CVPR). pp. 4614-4623 (June 2022)", "orig": "Computer Vision and Pattern Recognition (CVPR). pp. 4614-4623 (June 2022)", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 27, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 134.8, "r_y0": 314.1, "r_x1": 146.5, "r_y1": 314.1, "r_x2": 146.5, "r_y2": 306.0, "r_x3": 134.8, "r_y3": 306.0, "coord_origin": "TOPLEFT" }, "text": "10.", "orig": "10.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 28, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 151.1, "r_y0": 314.1, "r_x1": 480.6, "r_y1": 314.1, "r_x2": 480.6, "r_y2": 306.0, "r_x3": 151.1, "r_y3": 306.0, "coord_origin": "TOPLEFT" }, "text": "Pfitzmann, B., Auer, C., Dolfi, M., Nassar, A.S., Staar, P.W.J.: Doclaynet: A", "orig": "Pfitzmann, B., Auer, C., Dolfi, M., Nassar, A.S., Staar, P.W.J.: Doclaynet: A", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 29, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 151.5, "r_y0": 325.1, "r_x1": 480.6, "r_y1": 325.1, "r_x2": 480.6, "r_y2": 317.0, "r_x3": 151.5, "r_y3": 317.0, "coord_origin": "TOPLEFT" }, "text": "large human-annotated dataset for document-layout segmentation. In: Zhang, A.,", "orig": "large human-annotated dataset for document-layout segmentation. In: Zhang, A.,", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 30, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 151.5, "r_y0": 336.0, "r_x1": 480.6, "r_y1": 336.0, "r_x2": 480.6, "r_y2": 328.0, "r_x3": 151.5, "r_y3": 328.0, "coord_origin": "TOPLEFT" }, "text": "Rangwala, H. (eds.) KDD \u201922: The 28th ACM SIGKDD Conference on Knowledge", "orig": "Rangwala, H. (eds.) KDD \u201922: The 28th ACM SIGKDD Conference on Knowledge", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 31, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 151.5, "r_y0": 347.0, "r_x1": 480.6, "r_y1": 347.0, "r_x2": 480.6, "r_y2": 338.9, "r_x3": 151.5, "r_y3": 338.9, "coord_origin": "TOPLEFT" }, "text": "Discovery and Data Mining, Washington, DC, USA, August 14 - 18, 2022. pp.", "orig": "Discovery and Data Mining, Washington, DC, USA, August 14 - 18, 2022. pp.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 32, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 151.5, "r_y0": 357.9, "r_x1": 251.1, "r_y1": 357.9, "r_x2": 251.1, "r_y2": 349.9, "r_x3": 151.5, "r_y3": 349.9, "coord_origin": "TOPLEFT" }, "text": "3743-3751. ACM (2022).", "orig": "3743-3751. ACM (2022).", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 33, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 254.0, "r_y0": 358.0, "r_x1": 437.5, "r_y1": 358.0, "r_x2": 437.5, "r_y2": 350.5, "r_x3": 254.0, "r_y3": 350.5, "coord_origin": "TOPLEFT" }, "text": "https://doi.org/10.1145/3534678.3539043", "orig": "https://doi.org/10.1145/3534678.3539043", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 34, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 437.5, "r_y0": 357.9, "r_x1": 440.1, "r_y1": 357.9, "r_x2": 440.1, "r_y2": 349.9, "r_x3": 437.5, "r_y3": 349.9, "coord_origin": "TOPLEFT" }, "text": ",", "orig": ",", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 35, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 442.9, "r_y0": 358.0, "r_x1": 480.6, "r_y1": 358.0, "r_x2": 480.6, "r_y2": 350.5, "r_x3": 442.9, "r_y3": 350.5, "coord_origin": "TOPLEFT" }, "text": "https://", "orig": "https://", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 36, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 151.5, "r_y0": 368.9, "r_x1": 297.4, "r_y1": 368.9, "r_x2": 297.4, "r_y2": 361.5, "r_x3": 151.5, "r_y3": 361.5, "coord_origin": "TOPLEFT" }, "text": "doi.org/10.1145/3534678.3539043", "orig": "doi.org/10.1145/3534678.3539043", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 37, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 134.8, "r_y0": 379.9, "r_x1": 146.0, "r_y1": 379.9, "r_x2": 146.0, "r_y2": 371.8, "r_x3": 134.8, "r_y3": 371.8, "coord_origin": "TOPLEFT" }, "text": "11.", "orig": "11.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 38, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 150.5, "r_y0": 379.9, "r_x1": 480.6, "r_y1": 379.9, "r_x2": 480.6, "r_y2": 371.8, "r_x3": 150.5, "r_y3": 371.8, "coord_origin": "TOPLEFT" }, "text": "Prasad, D., Gadpal, A., Kapadni, K., Visave, M., Sultanpure, K.: Cascadetabnet:", "orig": "Prasad, D., Gadpal, A., Kapadni, K., Visave, M., Sultanpure, K.: Cascadetabnet:", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 39, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 151.5, "r_y0": 390.8, "r_x1": 480.6, "r_y1": 390.8, "r_x2": 480.6, "r_y2": 382.8, "r_x3": 151.5, "r_y3": 382.8, "coord_origin": "TOPLEFT" }, "text": "An approach for end to end table detection and structure recognition from image-", "orig": "An approach for end to end table detection and structure recognition from image-", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 40, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 151.5, "r_y0": 401.8, "r_x1": 480.6, "r_y1": 401.8, "r_x2": 480.6, "r_y2": 393.7, "r_x3": 151.5, "r_y3": 393.7, "coord_origin": "TOPLEFT" }, "text": "based documents. In: Proceedings of the IEEE/CVF conference on computer vision", "orig": "based documents. In: Proceedings of the IEEE/CVF conference on computer vision", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 41, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 151.5, "r_y0": 412.7, "r_x1": 373.8, "r_y1": 412.7, "r_x2": 373.8, "r_y2": 404.7, "r_x3": 151.5, "r_y3": 404.7, "coord_origin": "TOPLEFT" }, "text": "and pattern recognition workshops. pp. 572-573 (2020)", "orig": "and pattern recognition workshops. pp. 572-573 (2020)", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 42, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 134.8, "r_y0": 423.7, "r_x1": 145.9, "r_y1": 423.7, "r_x2": 145.9, "r_y2": 415.6, "r_x3": 134.8, "r_y3": 415.6, "coord_origin": "TOPLEFT" }, "text": "12.", "orig": "12.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 43, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 150.3, "r_y0": 423.7, "r_x1": 480.6, "r_y1": 423.7, "r_x2": 480.6, "r_y2": 415.6, "r_x3": 150.3, "r_y3": 415.6, "coord_origin": "TOPLEFT" }, "text": "Schreiber, S., Agne, S., Wolf, I., Dengel, A., Ahmed, S.: Deepdesrt: Deep learning", "orig": "Schreiber, S., Agne, S., Wolf, I., Dengel, A., Ahmed, S.: Deepdesrt: Deep learning", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 44, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 151.5, "r_y0": 434.7, "r_x1": 480.6, "r_y1": 434.7, "r_x2": 480.6, "r_y2": 426.6, "r_x3": 151.5, "r_y3": 426.6, "coord_origin": "TOPLEFT" }, "text": "for detection and structure recognition of tables in document images. In: 2017 14th", "orig": "for detection and structure recognition of tables in document images. In: 2017 14th", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 45, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 151.5, "r_y0": 445.6, "r_x1": 480.6, "r_y1": 445.6, "r_x2": 480.6, "r_y2": 437.6, "r_x3": 151.5, "r_y3": 437.6, "coord_origin": "TOPLEFT" }, "text": "IAPR international conference on document analysis and recognition (ICDAR).", "orig": "IAPR international conference on document analysis and recognition (ICDAR).", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 46, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 151.5, "r_y0": 456.6, "r_x1": 292.9, "r_y1": 456.6, "r_x2": 292.9, "r_y2": 448.5, "r_x3": 151.5, "r_y3": 448.5, "coord_origin": "TOPLEFT" }, "text": "vol. 1, pp. 1162-1167. IEEE (2017)", "orig": "vol. 1, pp. 1162-1167. IEEE (2017)", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 47, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 134.8, "r_y0": 467.6, "r_x1": 145.8, "r_y1": 467.6, "r_x2": 145.8, "r_y2": 459.5, "r_x3": 134.8, "r_y3": 459.5, "coord_origin": "TOPLEFT" }, "text": "13.", "orig": "13.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 48, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 150.1, "r_y0": 467.6, "r_x1": 480.6, "r_y1": 467.6, "r_x2": 480.6, "r_y2": 459.5, "r_x3": 150.1, "r_y3": 459.5, "coord_origin": "TOPLEFT" }, "text": "Siddiqui, S.A., Fateh, I.A., Rizvi, S.T.R., Dengel, A., Ahmed, S.: Deeptabstr: Deep", "orig": "Siddiqui, S.A., Fateh, I.A., Rizvi, S.T.R., Dengel, A., Ahmed, S.: Deeptabstr: Deep", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 49, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 151.5, "r_y0": 478.5, "r_x1": 480.6, "r_y1": 478.5, "r_x2": 480.6, "r_y2": 470.5, "r_x3": 151.5, "r_y3": 470.5, "coord_origin": "TOPLEFT" }, "text": "learning based table structure recognition. In: 2019 International Conference on", "orig": "learning based table structure recognition. In: 2019 International Conference on", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 50, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 151.5, "r_y0": 489.5, "r_x1": 439.1, "r_y1": 489.5, "r_x2": 439.1, "r_y2": 481.4, "r_x3": 151.5, "r_y3": 481.4, "coord_origin": "TOPLEFT" }, "text": "Document Analysis and Recognition (ICDAR). pp. 1403-1409 (2019).", "orig": "Document Analysis and Recognition (ICDAR). pp. 1403-1409 (2019).", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 51, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 442.9, "r_y0": 489.5, "r_x1": 480.6, "r_y1": 489.5, "r_x2": 480.6, "r_y2": 482.1, "r_x3": 442.9, "r_y3": 482.1, "coord_origin": "TOPLEFT" }, "text": "https://", "orig": "https://", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 52, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 151.5, "r_y0": 500.5, "r_x1": 302.1, "r_y1": 500.5, "r_x2": 302.1, "r_y2": 493.0, "r_x3": 151.5, "r_y3": 493.0, "coord_origin": "TOPLEFT" }, "text": "doi.org/10.1109/ICDAR.2019.00226", "orig": "doi.org/10.1109/ICDAR.2019.00226", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 53, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 134.8, "r_y0": 511.4, "r_x1": 146.2, "r_y1": 511.4, "r_x2": 146.2, "r_y2": 503.3, "r_x3": 134.8, "r_y3": 503.3, "coord_origin": "TOPLEFT" }, "text": "14.", "orig": "14.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 54, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 150.6, "r_y0": 511.4, "r_x1": 480.6, "r_y1": 511.4, "r_x2": 480.6, "r_y2": 503.3, "r_x3": 150.6, "r_y3": 503.3, "coord_origin": "TOPLEFT" }, "text": "Smock, B., Pesala, R., Abraham, R.: PubTables-1M: Towards comprehensive ta-", "orig": "Smock, B., Pesala, R., Abraham, R.: PubTables-1M: Towards comprehensive ta-", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 55, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 151.5, "r_y0": 522.4, "r_x1": 480.6, "r_y1": 522.4, "r_x2": 480.6, "r_y2": 514.3, "r_x3": 151.5, "r_y3": 514.3, "coord_origin": "TOPLEFT" }, "text": "ble extraction from unstructured documents. In: Proceedings of the IEEE/CVF", "orig": "ble extraction from unstructured documents. In: Proceedings of the IEEE/CVF", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 56, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 151.5, "r_y0": 533.3, "r_x1": 480.6, "r_y1": 533.3, "r_x2": 480.6, "r_y2": 525.3, "r_x3": 151.5, "r_y3": 525.3, "coord_origin": "TOPLEFT" }, "text": "Conference on Computer Vision and Pattern Recognition (CVPR). pp. 4634-4642", "orig": "Conference on Computer Vision and Pattern Recognition (CVPR). pp. 4634-4642", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 57, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 151.5, "r_y0": 544.3, "r_x1": 199.2, "r_y1": 544.3, "r_x2": 199.2, "r_y2": 536.2, "r_x3": 151.5, "r_y3": 536.2, "coord_origin": "TOPLEFT" }, "text": "(June 2022)", "orig": "(June 2022)", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 58, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 134.8, "r_y0": 555.3, "r_x1": 146.2, "r_y1": 555.3, "r_x2": 146.2, "r_y2": 547.2, "r_x3": 134.8, "r_y3": 547.2, "coord_origin": "TOPLEFT" }, "text": "15.", "orig": "15.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 59, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 150.6, "r_y0": 555.3, "r_x1": 480.6, "r_y1": 555.3, "r_x2": 480.6, "r_y2": 547.2, "r_x3": 150.6, "r_y3": 547.2, "coord_origin": "TOPLEFT" }, "text": "Staar, P.W.J., Dolfi, M., Auer, C., Bekas, C.: Corpus conversion service: A ma-", "orig": "Staar, P.W.J., Dolfi, M., Auer, C., Bekas, C.: Corpus conversion service: A ma-", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 60, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 151.5, "r_y0": 566.2, "r_x1": 480.6, "r_y1": 566.2, "r_x2": 480.6, "r_y2": 558.1, "r_x3": 151.5, "r_y3": 558.1, "coord_origin": "TOPLEFT" }, "text": "chine learning platform to ingest documents at scale. In: Proceedings of the 24th", "orig": "chine learning platform to ingest documents at scale. In: Proceedings of the 24th", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 61, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 151.5, "r_y0": 577.2, "r_x1": 480.6, "r_y1": 577.2, "r_x2": 480.6, "r_y2": 569.1, "r_x3": 151.5, "r_y3": 569.1, "coord_origin": "TOPLEFT" }, "text": "ACM SIGKDD International Conference on Knowledge Discovery & Data Min-", "orig": "ACM SIGKDD International Conference on Knowledge Discovery & Data Min-", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 62, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 151.5, "r_y0": 588.1, "r_x1": 480.6, "r_y1": 588.1, "r_x2": 480.6, "r_y2": 580.1, "r_x3": 151.5, "r_y3": 580.1, "coord_origin": "TOPLEFT" }, "text": "ing. pp. 774-782. KDD \u201918, Association for Computing Machinery, New York, NY,", "orig": "ing. pp. 774-782. KDD \u201918, Association for Computing Machinery, New York, NY,", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 63, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 151.5, "r_y0": 599.1, "r_x1": 200.8, "r_y1": 599.1, "r_x2": 200.8, "r_y2": 591.0, "r_x3": 151.5, "r_y3": 591.0, "coord_origin": "TOPLEFT" }, "text": "USA (2018).", "orig": "USA (2018).", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 64, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 202.9, "r_y0": 599.1, "r_x1": 386.5, "r_y1": 599.1, "r_x2": 386.5, "r_y2": 591.7, "r_x3": 202.9, "r_y3": 591.7, "coord_origin": "TOPLEFT" }, "text": "https://doi.org/10.1145/3219819.3219834", "orig": "https://doi.org/10.1145/3219819.3219834", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 65, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 386.5, "r_y0": 599.1, "r_x1": 389.0, "r_y1": 599.1, "r_x2": 389.0, "r_y2": 591.0, "r_x3": 386.5, "r_y3": 591.0, "coord_origin": "TOPLEFT" }, "text": ",", "orig": ",", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 66, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 391.2, "r_y0": 599.1, "r_x1": 480.6, "r_y1": 599.1, "r_x2": 480.6, "r_y2": 591.7, "r_x3": 391.2, "r_y3": 591.7, "coord_origin": "TOPLEFT" }, "text": "https://doi.org/10.", "orig": "https://doi.org/10.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 67, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 151.5, "r_y0": 610.1, "r_x1": 245.6, "r_y1": 610.1, "r_x2": 245.6, "r_y2": 602.6, "r_x3": 151.5, "r_y3": 602.6, "coord_origin": "TOPLEFT" }, "text": "1145/3219819.3219834", "orig": "1145/3219819.3219834", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 68, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 134.8, "r_y0": 621.0, "r_x1": 146.6, "r_y1": 621.0, "r_x2": 146.6, "r_y2": 613.0, "r_x3": 134.8, "r_y3": 613.0, "coord_origin": "TOPLEFT" }, "text": "16.", "orig": "16.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 69, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 151.3, "r_y0": 621.0, "r_x1": 480.6, "r_y1": 621.0, "r_x2": 480.6, "r_y2": 613.0, "r_x3": 151.3, "r_y3": 613.0, "coord_origin": "TOPLEFT" }, "text": "Wang, X.: Tabular Abstraction, Editing, and Formatting. Ph.D. thesis, CAN", "orig": "Wang, X.: Tabular Abstraction, Editing, and Formatting. Ph.D. thesis, CAN", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 70, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 151.5, "r_y0": 632.0, "r_x1": 234.4, "r_y1": 632.0, "r_x2": 234.4, "r_y2": 623.9, "r_x3": 151.5, "r_y3": 623.9, "coord_origin": "TOPLEFT" }, "text": "(1996), aAINN09397", "orig": "(1996), aAINN09397", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 71, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 134.8, "r_y0": 642.9, "r_x1": 146.3, "r_y1": 642.9, "r_x2": 146.3, "r_y2": 634.9, "r_x3": 134.8, "r_y3": 634.9, "coord_origin": "TOPLEFT" }, "text": "17.", "orig": "17.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 72, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 150.8, "r_y0": 642.9, "r_x1": 480.6, "r_y1": 642.9, "r_x2": 480.6, "r_y2": 634.9, "r_x3": 150.8, "r_y3": 634.9, "coord_origin": "TOPLEFT" }, "text": "Xue, W., Li, Q., Tao, D.: Res2tim: Reconstruct syntactic structures from table", "orig": "Xue, W., Li, Q., Tao, D.: Res2tim: Reconstruct syntactic structures from table", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 73, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 151.5, "r_y0": 653.9, "r_x1": 480.6, "r_y1": 653.9, "r_x2": 480.6, "r_y2": 645.8, "r_x3": 151.5, "r_y3": 645.8, "coord_origin": "TOPLEFT" }, "text": "images. In: 2019 International Conference on Document Analysis and Recognition", "orig": "images. In: 2019 International Conference on Document Analysis and Recognition", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 74, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 151.5, "r_y0": 664.9, "r_x1": 299.3, "r_y1": 664.9, "r_x2": 299.3, "r_y2": 656.8, "r_x3": 151.5, "r_y3": 656.8, "coord_origin": "TOPLEFT" }, "text": "(ICDAR). pp. 749-755. IEEE (2019)", "orig": "(ICDAR). pp. 749-755. IEEE (2019)", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "has_chars": false, "has_words": false, "has_lines": true, "image": null, "lines": [] }, "predictions": { "layout": { "clusters": [ { "id": 13, "label": "page_header", "bbox": { "l": 194.5, "t": 93.8, "r": 447.5, "b": 101.8, "coord_origin": "TOPLEFT" }, "confidence": 0.92, "cells": [ { "index": 0, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 194.5, "r_y0": 101.8, "r_x1": 447.5, "r_y1": 101.8, "r_x2": 447.5, "r_y2": 93.8, "r_x3": 194.5, "r_y3": 93.8, "coord_origin": "TOPLEFT" }, "text": "Optimized Table Tokenization for Table Structure Recognition", "orig": "Optimized Table Tokenization for Table Structure Recognition", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 14, "label": "page_header", "bbox": { "l": 471.4, "t": 93.8, "r": 480.6, "b": 101.8, "coord_origin": "TOPLEFT" }, "confidence": 0.91, "cells": [ { "index": 1, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 471.4, "r_y0": 101.8, "r_x1": 480.6, "r_y1": 101.8, "r_x2": 480.6, "r_y2": 93.8, "r_x3": 471.4, "r_y3": 93.8, "coord_origin": "TOPLEFT" }, "text": "13", "orig": "13", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 5, "label": "list_item", "bbox": { "l": 139.4, "t": 119.7, "r": 480.6, "b": 149.7, "coord_origin": "TOPLEFT" }, "confidence": 0.97, "cells": [ { "index": 2, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 139.4, "r_y0": 127.7, "r_x1": 146.0, "r_y1": 127.7, "r_x2": 146.0, "r_y2": 119.7, "r_x3": 139.4, "r_y3": 119.7, "coord_origin": "TOPLEFT" }, "text": "5.", "orig": "5.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 3, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 150.3, "r_y0": 127.7, "r_x1": 480.6, "r_y1": 127.7, "r_x2": 480.6, "r_y2": 119.7, "r_x3": 150.3, "r_y3": 119.7, "coord_origin": "TOPLEFT" }, "text": "Kayal, P., Anand, M., Desai, H., Singh, M.: Tables to latex: structure and content", "orig": "Kayal, P., Anand, M., Desai, H., Singh, M.: Tables to latex: structure and content", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 4, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 151.5, "r_y0": 138.7, "r_x1": 480.6, "r_y1": 138.7, "r_x2": 480.6, "r_y2": 130.6, "r_x3": 151.5, "r_y3": 130.6, "coord_origin": "TOPLEFT" }, "text": "extraction from scientific tables. International Journal on Document Analysis and", "orig": "extraction from scientific tables. International Journal on Document Analysis and", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 5, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 151.5, "r_y0": 149.7, "r_x1": 304.0, "r_y1": 149.7, "r_x2": 304.0, "r_y2": 141.6, "r_x3": 151.5, "r_y3": 141.6, "coord_origin": "TOPLEFT" }, "text": "Recognition (IJDAR) pp. 1-10 (2022)", "orig": "Recognition (IJDAR) pp. 1-10 (2022)", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 1, "label": "list_item", "bbox": { "l": 139.4, "t": 152.6, "r": 480.6, "b": 193.5, "coord_origin": "TOPLEFT" }, "confidence": 0.97, "cells": [ { "index": 6, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 139.4, "r_y0": 160.6, "r_x1": 145.9, "r_y1": 160.6, "r_x2": 145.9, "r_y2": 152.6, "r_x3": 139.4, "r_y3": 152.6, "coord_origin": "TOPLEFT" }, "text": "6.", "orig": "6.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 7, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 150.2, "r_y0": 160.6, "r_x1": 480.6, "r_y1": 160.6, "r_x2": 480.6, "r_y2": 152.6, "r_x3": 150.2, "r_y3": 152.6, "coord_origin": "TOPLEFT" }, "text": "Lee, E., Kwon, J., Yang, H., Park, J., Lee, S., Koo, H.I., Cho, N.I.: Table structure", "orig": "Lee, E., Kwon, J., Yang, H., Park, J., Lee, S., Koo, H.I., Cho, N.I.: Table structure", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 8, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 151.5, "r_y0": 171.6, "r_x1": 480.6, "r_y1": 171.6, "r_x2": 480.6, "r_y2": 163.5, "r_x3": 151.5, "r_y3": 163.5, "coord_origin": "TOPLEFT" }, "text": "recognition based on grid shape graph. In: 2022 Asia-Pacific Signal and Information", "orig": "recognition based on grid shape graph. In: 2022 Asia-Pacific Signal and Information", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 9, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 151.5, "r_y0": 182.5, "r_x1": 480.6, "r_y1": 182.5, "r_x2": 480.6, "r_y2": 174.5, "r_x3": 151.5, "r_y3": 174.5, "coord_origin": "TOPLEFT" }, "text": "Processing Association Annual Summit and Conference (APSIPA ASC). pp. 1868-", "orig": "Processing Association Annual Summit and Conference (APSIPA ASC). pp. 1868-", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 10, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 151.5, "r_y0": 193.5, "r_x1": 226.4, "r_y1": 193.5, "r_x2": 226.4, "r_y2": 185.4, "r_x3": 151.5, "r_y3": 185.4, "coord_origin": "TOPLEFT" }, "text": "1873. IEEE (2022)", "orig": "1873. IEEE (2022)", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 10, "label": "list_item", "bbox": { "l": 139.4, "t": 196.4, "r": 480.6, "b": 215.4, "coord_origin": "TOPLEFT" }, "confidence": 0.96, "cells": [ { "index": 11, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 139.4, "r_y0": 204.5, "r_x1": 146.3, "r_y1": 204.5, "r_x2": 146.3, "r_y2": 196.4, "r_x3": 139.4, "r_y3": 196.4, "coord_origin": "TOPLEFT" }, "text": "7.", "orig": "7.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 12, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 150.8, "r_y0": 204.5, "r_x1": 480.6, "r_y1": 204.5, "r_x2": 480.6, "r_y2": 196.4, "r_x3": 150.8, "r_y3": 196.4, "coord_origin": "TOPLEFT" }, "text": "Li, M., Cui, L., Huang, S., Wei, F., Zhou, M., Li, Z.: Tablebank: A benchmark", "orig": "Li, M., Cui, L., Huang, S., Wei, F., Zhou, M., Li, Z.: Tablebank: A benchmark", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 13, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 151.5, "r_y0": 215.4, "r_x1": 352.0, "r_y1": 215.4, "r_x2": 352.0, "r_y2": 207.4, "r_x3": 151.5, "r_y3": 207.4, "coord_origin": "TOPLEFT" }, "text": "dataset for table detection and recognition (2019)", "orig": "dataset for table detection and recognition (2019)", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 4, "label": "list_item", "bbox": { "l": 139.4, "t": 218.3, "r": 480.6, "b": 270.3, "coord_origin": "TOPLEFT" }, "confidence": 0.97, "cells": [ { "index": 14, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 139.4, "r_y0": 226.4, "r_x1": 146.4, "r_y1": 226.4, "r_x2": 146.4, "r_y2": 218.3, "r_x3": 139.4, "r_y3": 218.3, "coord_origin": "TOPLEFT" }, "text": "8.", "orig": "8.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 15, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 150.9, "r_y0": 226.4, "r_x1": 480.6, "r_y1": 226.4, "r_x2": 480.6, "r_y2": 218.3, "r_x3": 150.9, "r_y3": 218.3, "coord_origin": "TOPLEFT" }, "text": "Livathinos, N., Berrospi, C., Lysak, M., Kuropiatnyk, V., Nassar, A., Carvalho,", "orig": "Livathinos, N., Berrospi, C., Lysak, M., Kuropiatnyk, V., Nassar, A., Carvalho,", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 16, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 151.5, "r_y0": 237.4, "r_x1": 480.6, "r_y1": 237.4, "r_x2": 480.6, "r_y2": 229.3, "r_x3": 151.5, "r_y3": 229.3, "coord_origin": "TOPLEFT" }, "text": "A., Dolfi, M., Auer, C., Dinkla, K., Staar, P.: Robust pdf document conversion", "orig": "A., Dolfi, M., Auer, C., Dinkla, K., Staar, P.: Robust pdf document conversion", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 17, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 151.5, "r_y0": 248.3, "r_x1": 480.6, "r_y1": 248.3, "r_x2": 480.6, "r_y2": 240.3, "r_x3": 151.5, "r_y3": 240.3, "coord_origin": "TOPLEFT" }, "text": "using recurrent neural networks. Proceedings of the AAAI Conference on Artificial", "orig": "using recurrent neural networks. Proceedings of the AAAI Conference on Artificial", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 18, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 151.5, "r_y0": 259.3, "r_x1": 197.1, "r_y1": 259.3, "r_x2": 197.1, "r_y2": 251.2, "r_x3": 151.5, "r_y3": 251.2, "coord_origin": "TOPLEFT" }, "text": "Intelligence", "orig": "Intelligence", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 19, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 199.4, "r_y0": 259.1, "r_x1": 210.0, "r_y1": 259.1, "r_x2": 210.0, "r_y2": 251.2, "r_x3": 199.4, "r_y3": 251.2, "coord_origin": "TOPLEFT" }, "text": "35", "orig": "35", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 20, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 210.0, "r_y0": 259.3, "r_x1": 332.4, "r_y1": 259.3, "r_x2": 332.4, "r_y2": 251.2, "r_x3": 210.0, "r_y3": 251.2, "coord_origin": "TOPLEFT" }, "text": "(17), 15137-15145 (May 2021),", "orig": "(17), 15137-15145 (May 2021),", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 21, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 334.7, "r_y0": 259.3, "r_x1": 480.6, "r_y1": 259.3, "r_x2": 480.6, "r_y2": 251.9, "r_x3": 334.7, "r_y3": 251.9, "coord_origin": "TOPLEFT" }, "text": "https://ojs.aaai.org/index.php/", "orig": "https://ojs.aaai.org/index.php/", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 22, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 151.5, "r_y0": 270.3, "r_x1": 259.8, "r_y1": 270.3, "r_x2": 259.8, "r_y2": 262.8, "r_x3": 151.5, "r_y3": 262.8, "coord_origin": "TOPLEFT" }, "text": "AAAI/article/view/17777", "orig": "AAAI/article/view/17777", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 11, "label": "list_item", "bbox": { "l": 139.4, "t": 273.1, "r": 480.6, "b": 303.1, "coord_origin": "TOPLEFT" }, "confidence": 0.96, "cells": [ { "index": 23, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 139.4, "r_y0": 281.2, "r_x1": 146.1, "r_y1": 281.2, "r_x2": 146.1, "r_y2": 273.1, "r_x3": 139.4, "r_y3": 273.1, "coord_origin": "TOPLEFT" }, "text": "9.", "orig": "9.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 24, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 150.5, "r_y0": 281.2, "r_x1": 480.6, "r_y1": 281.2, "r_x2": 480.6, "r_y2": 273.1, "r_x3": 150.5, "r_y3": 273.1, "coord_origin": "TOPLEFT" }, "text": "Nassar, A., Livathinos, N., Lysak, M., Staar, P.: Tableformer: Table structure un-", "orig": "Nassar, A., Livathinos, N., Lysak, M., Staar, P.: Tableformer: Table structure un-", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 25, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 151.5, "r_y0": 292.2, "r_x1": 480.6, "r_y1": 292.2, "r_x2": 480.6, "r_y2": 284.1, "r_x3": 151.5, "r_y3": 284.1, "coord_origin": "TOPLEFT" }, "text": "derstanding with transformers. In: Proceedings of the IEEE/CVF Conference on", "orig": "derstanding with transformers. In: Proceedings of the IEEE/CVF Conference on", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 26, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 151.5, "r_y0": 303.1, "r_x1": 473.4, "r_y1": 303.1, "r_x2": 473.4, "r_y2": 295.1, "r_x3": 151.5, "r_y3": 295.1, "coord_origin": "TOPLEFT" }, "text": "Computer Vision and Pattern Recognition (CVPR). pp. 4614-4623 (June 2022)", "orig": "Computer Vision and Pattern Recognition (CVPR). pp. 4614-4623 (June 2022)", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 9, "label": "list_item", "bbox": { "l": 134.8, "t": 306.0, "r": 480.6, "b": 368.9, "coord_origin": "TOPLEFT" }, "confidence": 0.96, "cells": [ { "index": 27, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 134.8, "r_y0": 314.1, "r_x1": 146.5, "r_y1": 314.1, "r_x2": 146.5, "r_y2": 306.0, "r_x3": 134.8, "r_y3": 306.0, "coord_origin": "TOPLEFT" }, "text": "10.", "orig": "10.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 28, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 151.1, "r_y0": 314.1, "r_x1": 480.6, "r_y1": 314.1, "r_x2": 480.6, "r_y2": 306.0, "r_x3": 151.1, "r_y3": 306.0, "coord_origin": "TOPLEFT" }, "text": "Pfitzmann, B., Auer, C., Dolfi, M., Nassar, A.S., Staar, P.W.J.: Doclaynet: A", "orig": "Pfitzmann, B., Auer, C., Dolfi, M., Nassar, A.S., Staar, P.W.J.: Doclaynet: A", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 29, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 151.5, "r_y0": 325.1, "r_x1": 480.6, "r_y1": 325.1, "r_x2": 480.6, "r_y2": 317.0, "r_x3": 151.5, "r_y3": 317.0, "coord_origin": "TOPLEFT" }, "text": "large human-annotated dataset for document-layout segmentation. In: Zhang, A.,", "orig": "large human-annotated dataset for document-layout segmentation. In: Zhang, A.,", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 30, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 151.5, "r_y0": 336.0, "r_x1": 480.6, "r_y1": 336.0, "r_x2": 480.6, "r_y2": 328.0, "r_x3": 151.5, "r_y3": 328.0, "coord_origin": "TOPLEFT" }, "text": "Rangwala, H. (eds.) KDD \u201922: The 28th ACM SIGKDD Conference on Knowledge", "orig": "Rangwala, H. (eds.) KDD \u201922: The 28th ACM SIGKDD Conference on Knowledge", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 31, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 151.5, "r_y0": 347.0, "r_x1": 480.6, "r_y1": 347.0, "r_x2": 480.6, "r_y2": 338.9, "r_x3": 151.5, "r_y3": 338.9, "coord_origin": "TOPLEFT" }, "text": "Discovery and Data Mining, Washington, DC, USA, August 14 - 18, 2022. pp.", "orig": "Discovery and Data Mining, Washington, DC, USA, August 14 - 18, 2022. pp.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 32, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 151.5, "r_y0": 357.9, "r_x1": 251.1, "r_y1": 357.9, "r_x2": 251.1, "r_y2": 349.9, "r_x3": 151.5, "r_y3": 349.9, "coord_origin": "TOPLEFT" }, "text": "3743-3751. ACM (2022).", "orig": "3743-3751. ACM (2022).", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 33, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 254.0, "r_y0": 358.0, "r_x1": 437.5, "r_y1": 358.0, "r_x2": 437.5, "r_y2": 350.5, "r_x3": 254.0, "r_y3": 350.5, "coord_origin": "TOPLEFT" }, "text": "https://doi.org/10.1145/3534678.3539043", "orig": "https://doi.org/10.1145/3534678.3539043", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 34, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 437.5, "r_y0": 357.9, "r_x1": 440.1, "r_y1": 357.9, "r_x2": 440.1, "r_y2": 349.9, "r_x3": 437.5, "r_y3": 349.9, "coord_origin": "TOPLEFT" }, "text": ",", "orig": ",", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 35, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 442.9, "r_y0": 358.0, "r_x1": 480.6, "r_y1": 358.0, "r_x2": 480.6, "r_y2": 350.5, "r_x3": 442.9, "r_y3": 350.5, "coord_origin": "TOPLEFT" }, "text": "https://", "orig": "https://", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 36, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 151.5, "r_y0": 368.9, "r_x1": 297.4, "r_y1": 368.9, "r_x2": 297.4, "r_y2": 361.5, "r_x3": 151.5, "r_y3": 361.5, "coord_origin": "TOPLEFT" }, "text": "doi.org/10.1145/3534678.3539043", "orig": "doi.org/10.1145/3534678.3539043", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 0, "label": "list_item", "bbox": { "l": 134.8, "t": 371.8, "r": 480.6, "b": 412.7, "coord_origin": "TOPLEFT" }, "confidence": 0.98, "cells": [ { "index": 37, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 134.8, "r_y0": 379.9, "r_x1": 146.0, "r_y1": 379.9, "r_x2": 146.0, "r_y2": 371.8, "r_x3": 134.8, "r_y3": 371.8, "coord_origin": "TOPLEFT" }, "text": "11.", "orig": "11.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 38, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 150.5, "r_y0": 379.9, "r_x1": 480.6, "r_y1": 379.9, "r_x2": 480.6, "r_y2": 371.8, "r_x3": 150.5, "r_y3": 371.8, "coord_origin": "TOPLEFT" }, "text": "Prasad, D., Gadpal, A., Kapadni, K., Visave, M., Sultanpure, K.: Cascadetabnet:", "orig": "Prasad, D., Gadpal, A., Kapadni, K., Visave, M., Sultanpure, K.: Cascadetabnet:", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 39, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 151.5, "r_y0": 390.8, "r_x1": 480.6, "r_y1": 390.8, "r_x2": 480.6, "r_y2": 382.8, "r_x3": 151.5, "r_y3": 382.8, "coord_origin": "TOPLEFT" }, "text": "An approach for end to end table detection and structure recognition from image-", "orig": "An approach for end to end table detection and structure recognition from image-", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 40, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 151.5, "r_y0": 401.8, "r_x1": 480.6, "r_y1": 401.8, "r_x2": 480.6, "r_y2": 393.7, "r_x3": 151.5, "r_y3": 393.7, "coord_origin": "TOPLEFT" }, "text": "based documents. In: Proceedings of the IEEE/CVF conference on computer vision", "orig": "based documents. In: Proceedings of the IEEE/CVF conference on computer vision", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 41, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 151.5, "r_y0": 412.7, "r_x1": 373.8, "r_y1": 412.7, "r_x2": 373.8, "r_y2": 404.7, "r_x3": 151.5, "r_y3": 404.7, "coord_origin": "TOPLEFT" }, "text": "and pattern recognition workshops. pp. 572-573 (2020)", "orig": "and pattern recognition workshops. pp. 572-573 (2020)", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 3, "label": "list_item", "bbox": { "l": 134.8, "t": 415.6, "r": 480.6, "b": 456.6, "coord_origin": "TOPLEFT" }, "confidence": 0.97, "cells": [ { "index": 42, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 134.8, "r_y0": 423.7, "r_x1": 145.9, "r_y1": 423.7, "r_x2": 145.9, "r_y2": 415.6, "r_x3": 134.8, "r_y3": 415.6, "coord_origin": "TOPLEFT" }, "text": "12.", "orig": "12.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 43, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 150.3, "r_y0": 423.7, "r_x1": 480.6, "r_y1": 423.7, "r_x2": 480.6, "r_y2": 415.6, "r_x3": 150.3, "r_y3": 415.6, "coord_origin": "TOPLEFT" }, "text": "Schreiber, S., Agne, S., Wolf, I., Dengel, A., Ahmed, S.: Deepdesrt: Deep learning", "orig": "Schreiber, S., Agne, S., Wolf, I., Dengel, A., Ahmed, S.: Deepdesrt: Deep learning", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 44, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 151.5, "r_y0": 434.7, "r_x1": 480.6, "r_y1": 434.7, "r_x2": 480.6, "r_y2": 426.6, "r_x3": 151.5, "r_y3": 426.6, "coord_origin": "TOPLEFT" }, "text": "for detection and structure recognition of tables in document images. In: 2017 14th", "orig": "for detection and structure recognition of tables in document images. In: 2017 14th", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 45, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 151.5, "r_y0": 445.6, "r_x1": 480.6, "r_y1": 445.6, "r_x2": 480.6, "r_y2": 437.6, "r_x3": 151.5, "r_y3": 437.6, "coord_origin": "TOPLEFT" }, "text": "IAPR international conference on document analysis and recognition (ICDAR).", "orig": "IAPR international conference on document analysis and recognition (ICDAR).", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 46, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 151.5, "r_y0": 456.6, "r_x1": 292.9, "r_y1": 456.6, "r_x2": 292.9, "r_y2": 448.5, "r_x3": 151.5, "r_y3": 448.5, "coord_origin": "TOPLEFT" }, "text": "vol. 1, pp. 1162-1167. IEEE (2017)", "orig": "vol. 1, pp. 1162-1167. IEEE (2017)", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 7, "label": "list_item", "bbox": { "l": 134.8, "t": 459.5, "r": 480.6, "b": 500.5, "coord_origin": "TOPLEFT" }, "confidence": 0.97, "cells": [ { "index": 47, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 134.8, "r_y0": 467.6, "r_x1": 145.8, "r_y1": 467.6, "r_x2": 145.8, "r_y2": 459.5, "r_x3": 134.8, "r_y3": 459.5, "coord_origin": "TOPLEFT" }, "text": "13.", "orig": "13.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 48, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 150.1, "r_y0": 467.6, "r_x1": 480.6, "r_y1": 467.6, "r_x2": 480.6, "r_y2": 459.5, "r_x3": 150.1, "r_y3": 459.5, "coord_origin": "TOPLEFT" }, "text": "Siddiqui, S.A., Fateh, I.A., Rizvi, S.T.R., Dengel, A., Ahmed, S.: Deeptabstr: Deep", "orig": "Siddiqui, S.A., Fateh, I.A., Rizvi, S.T.R., Dengel, A., Ahmed, S.: Deeptabstr: Deep", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 49, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 151.5, "r_y0": 478.5, "r_x1": 480.6, "r_y1": 478.5, "r_x2": 480.6, "r_y2": 470.5, "r_x3": 151.5, "r_y3": 470.5, "coord_origin": "TOPLEFT" }, "text": "learning based table structure recognition. In: 2019 International Conference on", "orig": "learning based table structure recognition. In: 2019 International Conference on", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 50, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 151.5, "r_y0": 489.5, "r_x1": 439.1, "r_y1": 489.5, "r_x2": 439.1, "r_y2": 481.4, "r_x3": 151.5, "r_y3": 481.4, "coord_origin": "TOPLEFT" }, "text": "Document Analysis and Recognition (ICDAR). pp. 1403-1409 (2019).", "orig": "Document Analysis and Recognition (ICDAR). pp. 1403-1409 (2019).", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 51, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 442.9, "r_y0": 489.5, "r_x1": 480.6, "r_y1": 489.5, "r_x2": 480.6, "r_y2": 482.1, "r_x3": 442.9, "r_y3": 482.1, "coord_origin": "TOPLEFT" }, "text": "https://", "orig": "https://", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 52, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 151.5, "r_y0": 500.5, "r_x1": 302.1, "r_y1": 500.5, "r_x2": 302.1, "r_y2": 493.0, "r_x3": 151.5, "r_y3": 493.0, "coord_origin": "TOPLEFT" }, "text": "doi.org/10.1109/ICDAR.2019.00226", "orig": "doi.org/10.1109/ICDAR.2019.00226", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 2, "label": "list_item", "bbox": { "l": 134.8, "t": 503.3, "r": 480.6, "b": 544.3, "coord_origin": "TOPLEFT" }, "confidence": 0.97, "cells": [ { "index": 53, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 134.8, "r_y0": 511.4, "r_x1": 146.2, "r_y1": 511.4, "r_x2": 146.2, "r_y2": 503.3, "r_x3": 134.8, "r_y3": 503.3, "coord_origin": "TOPLEFT" }, "text": "14.", "orig": "14.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 54, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 150.6, "r_y0": 511.4, "r_x1": 480.6, "r_y1": 511.4, "r_x2": 480.6, "r_y2": 503.3, "r_x3": 150.6, "r_y3": 503.3, "coord_origin": "TOPLEFT" }, "text": "Smock, B., Pesala, R., Abraham, R.: PubTables-1M: Towards comprehensive ta-", "orig": "Smock, B., Pesala, R., Abraham, R.: PubTables-1M: Towards comprehensive ta-", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 55, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 151.5, "r_y0": 522.4, "r_x1": 480.6, "r_y1": 522.4, "r_x2": 480.6, "r_y2": 514.3, "r_x3": 151.5, "r_y3": 514.3, "coord_origin": "TOPLEFT" }, "text": "ble extraction from unstructured documents. In: Proceedings of the IEEE/CVF", "orig": "ble extraction from unstructured documents. In: Proceedings of the IEEE/CVF", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 56, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 151.5, "r_y0": 533.3, "r_x1": 480.6, "r_y1": 533.3, "r_x2": 480.6, "r_y2": 525.3, "r_x3": 151.5, "r_y3": 525.3, "coord_origin": "TOPLEFT" }, "text": "Conference on Computer Vision and Pattern Recognition (CVPR). pp. 4634-4642", "orig": "Conference on Computer Vision and Pattern Recognition (CVPR). pp. 4634-4642", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 57, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 151.5, "r_y0": 544.3, "r_x1": 199.2, "r_y1": 544.3, "r_x2": 199.2, "r_y2": 536.2, "r_x3": 151.5, "r_y3": 536.2, "coord_origin": "TOPLEFT" }, "text": "(June 2022)", "orig": "(June 2022)", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 6, "label": "list_item", "bbox": { "l": 134.8, "t": 547.2, "r": 480.6, "b": 610.1, "coord_origin": "TOPLEFT" }, "confidence": 0.97, "cells": [ { "index": 58, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 134.8, "r_y0": 555.3, "r_x1": 146.2, "r_y1": 555.3, "r_x2": 146.2, "r_y2": 547.2, "r_x3": 134.8, "r_y3": 547.2, "coord_origin": "TOPLEFT" }, "text": "15.", "orig": "15.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 59, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 150.6, "r_y0": 555.3, "r_x1": 480.6, "r_y1": 555.3, "r_x2": 480.6, "r_y2": 547.2, "r_x3": 150.6, "r_y3": 547.2, "coord_origin": "TOPLEFT" }, "text": "Staar, P.W.J., Dolfi, M., Auer, C., Bekas, C.: Corpus conversion service: A ma-", "orig": "Staar, P.W.J., Dolfi, M., Auer, C., Bekas, C.: Corpus conversion service: A ma-", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 60, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 151.5, "r_y0": 566.2, "r_x1": 480.6, "r_y1": 566.2, "r_x2": 480.6, "r_y2": 558.1, "r_x3": 151.5, "r_y3": 558.1, "coord_origin": "TOPLEFT" }, "text": "chine learning platform to ingest documents at scale. In: Proceedings of the 24th", "orig": "chine learning platform to ingest documents at scale. In: Proceedings of the 24th", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 61, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 151.5, "r_y0": 577.2, "r_x1": 480.6, "r_y1": 577.2, "r_x2": 480.6, "r_y2": 569.1, "r_x3": 151.5, "r_y3": 569.1, "coord_origin": "TOPLEFT" }, "text": "ACM SIGKDD International Conference on Knowledge Discovery & Data Min-", "orig": "ACM SIGKDD International Conference on Knowledge Discovery & Data Min-", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 62, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 151.5, "r_y0": 588.1, "r_x1": 480.6, "r_y1": 588.1, "r_x2": 480.6, "r_y2": 580.1, "r_x3": 151.5, "r_y3": 580.1, "coord_origin": "TOPLEFT" }, "text": "ing. pp. 774-782. KDD \u201918, Association for Computing Machinery, New York, NY,", "orig": "ing. pp. 774-782. KDD \u201918, Association for Computing Machinery, New York, NY,", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 63, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 151.5, "r_y0": 599.1, "r_x1": 200.8, "r_y1": 599.1, "r_x2": 200.8, "r_y2": 591.0, "r_x3": 151.5, "r_y3": 591.0, "coord_origin": "TOPLEFT" }, "text": "USA (2018).", "orig": "USA (2018).", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 64, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 202.9, "r_y0": 599.1, "r_x1": 386.5, "r_y1": 599.1, "r_x2": 386.5, "r_y2": 591.7, "r_x3": 202.9, "r_y3": 591.7, "coord_origin": "TOPLEFT" }, "text": "https://doi.org/10.1145/3219819.3219834", "orig": "https://doi.org/10.1145/3219819.3219834", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 65, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 386.5, "r_y0": 599.1, "r_x1": 389.0, "r_y1": 599.1, "r_x2": 389.0, "r_y2": 591.0, "r_x3": 386.5, "r_y3": 591.0, "coord_origin": "TOPLEFT" }, "text": ",", "orig": ",", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 66, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 391.2, "r_y0": 599.1, "r_x1": 480.6, "r_y1": 599.1, "r_x2": 480.6, "r_y2": 591.7, "r_x3": 391.2, "r_y3": 591.7, "coord_origin": "TOPLEFT" }, "text": "https://doi.org/10.", "orig": "https://doi.org/10.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 67, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 151.5, "r_y0": 610.1, "r_x1": 245.6, "r_y1": 610.1, "r_x2": 245.6, "r_y2": 602.6, "r_x3": 151.5, "r_y3": 602.6, "coord_origin": "TOPLEFT" }, "text": "1145/3219819.3219834", "orig": "1145/3219819.3219834", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 12, "label": "list_item", "bbox": { "l": 134.8, "t": 613.0, "r": 480.6, "b": 632.0, "coord_origin": "TOPLEFT" }, "confidence": 0.94, "cells": [ { "index": 68, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 134.8, "r_y0": 621.0, "r_x1": 146.6, "r_y1": 621.0, "r_x2": 146.6, "r_y2": 613.0, "r_x3": 134.8, "r_y3": 613.0, "coord_origin": "TOPLEFT" }, "text": "16.", "orig": "16.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 69, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 151.3, "r_y0": 621.0, "r_x1": 480.6, "r_y1": 621.0, "r_x2": 480.6, "r_y2": 613.0, "r_x3": 151.3, "r_y3": 613.0, "coord_origin": "TOPLEFT" }, "text": "Wang, X.: Tabular Abstraction, Editing, and Formatting. Ph.D. thesis, CAN", "orig": "Wang, X.: Tabular Abstraction, Editing, and Formatting. Ph.D. thesis, CAN", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 70, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 151.5, "r_y0": 632.0, "r_x1": 234.4, "r_y1": 632.0, "r_x2": 234.4, "r_y2": 623.9, "r_x3": 151.5, "r_y3": 623.9, "coord_origin": "TOPLEFT" }, "text": "(1996), aAINN09397", "orig": "(1996), aAINN09397", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 8, "label": "list_item", "bbox": { "l": 134.8, "t": 634.9, "r": 480.6, "b": 664.9, "coord_origin": "TOPLEFT" }, "confidence": 0.96, "cells": [ { "index": 71, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 134.8, "r_y0": 642.9, "r_x1": 146.3, "r_y1": 642.9, "r_x2": 146.3, "r_y2": 634.9, "r_x3": 134.8, "r_y3": 634.9, "coord_origin": "TOPLEFT" }, "text": "17.", "orig": "17.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 72, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 150.8, "r_y0": 642.9, "r_x1": 480.6, "r_y1": 642.9, "r_x2": 480.6, "r_y2": 634.9, "r_x3": 150.8, "r_y3": 634.9, "coord_origin": "TOPLEFT" }, "text": "Xue, W., Li, Q., Tao, D.: Res2tim: Reconstruct syntactic structures from table", "orig": "Xue, W., Li, Q., Tao, D.: Res2tim: Reconstruct syntactic structures from table", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 73, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 151.5, "r_y0": 653.9, "r_x1": 480.6, "r_y1": 653.9, "r_x2": 480.6, "r_y2": 645.8, "r_x3": 151.5, "r_y3": 645.8, "coord_origin": "TOPLEFT" }, "text": "images. In: 2019 International Conference on Document Analysis and Recognition", "orig": "images. In: 2019 International Conference on Document Analysis and Recognition", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 74, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 151.5, "r_y0": 664.9, "r_x1": 299.3, "r_y1": 664.9, "r_x2": 299.3, "r_y2": 656.8, "r_x3": 151.5, "r_y3": 656.8, "coord_origin": "TOPLEFT" }, "text": "(ICDAR). pp. 749-755. IEEE (2019)", "orig": "(ICDAR). pp. 749-755. IEEE (2019)", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] } ] }, "tablestructure": { "table_map": {} }, "figures_classification": null, "equations_prediction": null, "vlm_response": null }, "assembled": { "elements": [ { "label": "page_header", "id": 13, "page_no": 12, "cluster": { "id": 13, "label": "page_header", "bbox": { "l": 194.5, "t": 93.8, "r": 447.5, "b": 101.8, "coord_origin": "TOPLEFT" }, "confidence": 0.92, "cells": [ { "index": 0, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 194.5, "r_y0": 101.8, "r_x1": 447.5, "r_y1": 101.8, "r_x2": 447.5, "r_y2": 93.8, "r_x3": 194.5, "r_y3": 93.8, "coord_origin": "TOPLEFT" }, "text": "Optimized Table Tokenization for Table Structure Recognition", "orig": "Optimized Table Tokenization for Table Structure Recognition", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, "text": "Optimized Table Tokenization for Table Structure Recognition" }, { "label": "page_header", "id": 14, "page_no": 12, "cluster": { "id": 14, "label": "page_header", "bbox": { "l": 471.4, "t": 93.8, "r": 480.6, "b": 101.8, "coord_origin": "TOPLEFT" }, "confidence": 0.91, "cells": [ { "index": 1, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 471.4, "r_y0": 101.8, "r_x1": 480.6, "r_y1": 101.8, "r_x2": 480.6, "r_y2": 93.8, "r_x3": 471.4, "r_y3": 93.8, "coord_origin": "TOPLEFT" }, "text": "13", "orig": "13", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, "text": "13" }, { "label": "list_item", "id": 5, "page_no": 12, "cluster": { "id": 5, "label": "list_item", "bbox": { "l": 139.4, "t": 119.7, "r": 480.6, "b": 149.7, "coord_origin": "TOPLEFT" }, "confidence": 0.97, "cells": [ { "index": 2, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 139.4, "r_y0": 127.7, "r_x1": 146.0, "r_y1": 127.7, "r_x2": 146.0, "r_y2": 119.7, "r_x3": 139.4, "r_y3": 119.7, "coord_origin": "TOPLEFT" }, "text": "5.", "orig": "5.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 3, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 150.3, "r_y0": 127.7, "r_x1": 480.6, "r_y1": 127.7, "r_x2": 480.6, "r_y2": 119.7, "r_x3": 150.3, "r_y3": 119.7, "coord_origin": "TOPLEFT" }, "text": "Kayal, P., Anand, M., Desai, H., Singh, M.: Tables to latex: structure and content", "orig": "Kayal, P., Anand, M., Desai, H., Singh, M.: Tables to latex: structure and content", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 4, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 151.5, "r_y0": 138.7, "r_x1": 480.6, "r_y1": 138.7, "r_x2": 480.6, "r_y2": 130.6, "r_x3": 151.5, "r_y3": 130.6, "coord_origin": "TOPLEFT" }, "text": "extraction from scientific tables. International Journal on Document Analysis and", "orig": "extraction from scientific tables. International Journal on Document Analysis and", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 5, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 151.5, "r_y0": 149.7, "r_x1": 304.0, "r_y1": 149.7, "r_x2": 304.0, "r_y2": 141.6, "r_x3": 151.5, "r_y3": 141.6, "coord_origin": "TOPLEFT" }, "text": "Recognition (IJDAR) pp. 1-10 (2022)", "orig": "Recognition (IJDAR) pp. 1-10 (2022)", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, "text": "5. Kayal, P., Anand, M., Desai, H., Singh, M.: Tables to latex: structure and content extraction from scientific tables. International Journal on Document Analysis and Recognition (IJDAR) pp. 1-10 (2022)" }, { "label": "list_item", "id": 1, "page_no": 12, "cluster": { "id": 1, "label": "list_item", "bbox": { "l": 139.4, "t": 152.6, "r": 480.6, "b": 193.5, "coord_origin": "TOPLEFT" }, "confidence": 0.97, "cells": [ { "index": 6, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 139.4, "r_y0": 160.6, "r_x1": 145.9, "r_y1": 160.6, "r_x2": 145.9, "r_y2": 152.6, "r_x3": 139.4, "r_y3": 152.6, "coord_origin": "TOPLEFT" }, "text": "6.", "orig": "6.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 7, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 150.2, "r_y0": 160.6, "r_x1": 480.6, "r_y1": 160.6, "r_x2": 480.6, "r_y2": 152.6, "r_x3": 150.2, "r_y3": 152.6, "coord_origin": "TOPLEFT" }, "text": "Lee, E., Kwon, J., Yang, H., Park, J., Lee, S., Koo, H.I., Cho, N.I.: Table structure", "orig": "Lee, E., Kwon, J., Yang, H., Park, J., Lee, S., Koo, H.I., Cho, N.I.: Table structure", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 8, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 151.5, "r_y0": 171.6, "r_x1": 480.6, "r_y1": 171.6, "r_x2": 480.6, "r_y2": 163.5, "r_x3": 151.5, "r_y3": 163.5, "coord_origin": "TOPLEFT" }, "text": "recognition based on grid shape graph. In: 2022 Asia-Pacific Signal and Information", "orig": "recognition based on grid shape graph. In: 2022 Asia-Pacific Signal and Information", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 9, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 151.5, "r_y0": 182.5, "r_x1": 480.6, "r_y1": 182.5, "r_x2": 480.6, "r_y2": 174.5, "r_x3": 151.5, "r_y3": 174.5, "coord_origin": "TOPLEFT" }, "text": "Processing Association Annual Summit and Conference (APSIPA ASC). pp. 1868-", "orig": "Processing Association Annual Summit and Conference (APSIPA ASC). pp. 1868-", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 10, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 151.5, "r_y0": 193.5, "r_x1": 226.4, "r_y1": 193.5, "r_x2": 226.4, "r_y2": 185.4, "r_x3": 151.5, "r_y3": 185.4, "coord_origin": "TOPLEFT" }, "text": "1873. IEEE (2022)", "orig": "1873. IEEE (2022)", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, "text": "6. Lee, E., Kwon, J., Yang, H., Park, J., Lee, S., Koo, H.I., Cho, N.I.: Table structure recognition based on grid shape graph. In: 2022 Asia-Pacific Signal and Information Processing Association Annual Summit and Conference (APSIPA ASC). pp. 18681873. IEEE (2022)" }, { "label": "list_item", "id": 10, "page_no": 12, "cluster": { "id": 10, "label": "list_item", "bbox": { "l": 139.4, "t": 196.4, "r": 480.6, "b": 215.4, "coord_origin": "TOPLEFT" }, "confidence": 0.96, "cells": [ { "index": 11, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 139.4, "r_y0": 204.5, "r_x1": 146.3, "r_y1": 204.5, "r_x2": 146.3, "r_y2": 196.4, "r_x3": 139.4, "r_y3": 196.4, "coord_origin": "TOPLEFT" }, "text": "7.", "orig": "7.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 12, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 150.8, "r_y0": 204.5, "r_x1": 480.6, "r_y1": 204.5, "r_x2": 480.6, "r_y2": 196.4, "r_x3": 150.8, "r_y3": 196.4, "coord_origin": "TOPLEFT" }, "text": "Li, M., Cui, L., Huang, S., Wei, F., Zhou, M., Li, Z.: Tablebank: A benchmark", "orig": "Li, M., Cui, L., Huang, S., Wei, F., Zhou, M., Li, Z.: Tablebank: A benchmark", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 13, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 151.5, "r_y0": 215.4, "r_x1": 352.0, "r_y1": 215.4, "r_x2": 352.0, "r_y2": 207.4, "r_x3": 151.5, "r_y3": 207.4, "coord_origin": "TOPLEFT" }, "text": "dataset for table detection and recognition (2019)", "orig": "dataset for table detection and recognition (2019)", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, "text": "7. Li, M., Cui, L., Huang, S., Wei, F., Zhou, M., Li, Z.: Tablebank: A benchmark dataset for table detection and recognition (2019)" }, { "label": "list_item", "id": 4, "page_no": 12, "cluster": { "id": 4, "label": "list_item", "bbox": { "l": 139.4, "t": 218.3, "r": 480.6, "b": 270.3, "coord_origin": "TOPLEFT" }, "confidence": 0.97, "cells": [ { "index": 14, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 139.4, "r_y0": 226.4, "r_x1": 146.4, "r_y1": 226.4, "r_x2": 146.4, "r_y2": 218.3, "r_x3": 139.4, "r_y3": 218.3, "coord_origin": "TOPLEFT" }, "text": "8.", "orig": "8.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 15, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 150.9, "r_y0": 226.4, "r_x1": 480.6, "r_y1": 226.4, "r_x2": 480.6, "r_y2": 218.3, "r_x3": 150.9, "r_y3": 218.3, "coord_origin": "TOPLEFT" }, "text": "Livathinos, N., Berrospi, C., Lysak, M., Kuropiatnyk, V., Nassar, A., Carvalho,", "orig": "Livathinos, N., Berrospi, C., Lysak, M., Kuropiatnyk, V., Nassar, A., Carvalho,", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 16, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 151.5, "r_y0": 237.4, "r_x1": 480.6, "r_y1": 237.4, "r_x2": 480.6, "r_y2": 229.3, "r_x3": 151.5, "r_y3": 229.3, "coord_origin": "TOPLEFT" }, "text": "A., Dolfi, M., Auer, C., Dinkla, K., Staar, P.: Robust pdf document conversion", "orig": "A., Dolfi, M., Auer, C., Dinkla, K., Staar, P.: Robust pdf document conversion", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 17, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 151.5, "r_y0": 248.3, "r_x1": 480.6, "r_y1": 248.3, "r_x2": 480.6, "r_y2": 240.3, "r_x3": 151.5, "r_y3": 240.3, "coord_origin": "TOPLEFT" }, "text": "using recurrent neural networks. Proceedings of the AAAI Conference on Artificial", "orig": "using recurrent neural networks. Proceedings of the AAAI Conference on Artificial", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 18, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 151.5, "r_y0": 259.3, "r_x1": 197.1, "r_y1": 259.3, "r_x2": 197.1, "r_y2": 251.2, "r_x3": 151.5, "r_y3": 251.2, "coord_origin": "TOPLEFT" }, "text": "Intelligence", "orig": "Intelligence", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 19, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 199.4, "r_y0": 259.1, "r_x1": 210.0, "r_y1": 259.1, "r_x2": 210.0, "r_y2": 251.2, "r_x3": 199.4, "r_y3": 251.2, "coord_origin": "TOPLEFT" }, "text": "35", "orig": "35", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 20, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 210.0, "r_y0": 259.3, "r_x1": 332.4, "r_y1": 259.3, "r_x2": 332.4, "r_y2": 251.2, "r_x3": 210.0, "r_y3": 251.2, "coord_origin": "TOPLEFT" }, "text": "(17), 15137-15145 (May 2021),", "orig": "(17), 15137-15145 (May 2021),", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 21, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 334.7, "r_y0": 259.3, "r_x1": 480.6, "r_y1": 259.3, "r_x2": 480.6, "r_y2": 251.9, "r_x3": 334.7, "r_y3": 251.9, "coord_origin": "TOPLEFT" }, "text": "https://ojs.aaai.org/index.php/", "orig": "https://ojs.aaai.org/index.php/", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 22, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 151.5, "r_y0": 270.3, "r_x1": 259.8, "r_y1": 270.3, "r_x2": 259.8, "r_y2": 262.8, "r_x3": 151.5, "r_y3": 262.8, "coord_origin": "TOPLEFT" }, "text": "AAAI/article/view/17777", "orig": "AAAI/article/view/17777", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, "text": "8. Livathinos, N., Berrospi, C., Lysak, M., Kuropiatnyk, V., Nassar, A., Carvalho, A., Dolfi, M., Auer, C., Dinkla, K., Staar, P.: Robust pdf document conversion using recurrent neural networks. Proceedings of the AAAI Conference on Artificial Intelligence 35 (17), 15137-15145 (May 2021), https://ojs.aaai.org/index.php/ AAAI/article/view/17777" }, { "label": "list_item", "id": 11, "page_no": 12, "cluster": { "id": 11, "label": "list_item", "bbox": { "l": 139.4, "t": 273.1, "r": 480.6, "b": 303.1, "coord_origin": "TOPLEFT" }, "confidence": 0.96, "cells": [ { "index": 23, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 139.4, "r_y0": 281.2, "r_x1": 146.1, "r_y1": 281.2, "r_x2": 146.1, "r_y2": 273.1, "r_x3": 139.4, "r_y3": 273.1, "coord_origin": "TOPLEFT" }, "text": "9.", "orig": "9.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 24, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 150.5, "r_y0": 281.2, "r_x1": 480.6, "r_y1": 281.2, "r_x2": 480.6, "r_y2": 273.1, "r_x3": 150.5, "r_y3": 273.1, "coord_origin": "TOPLEFT" }, "text": "Nassar, A., Livathinos, N., Lysak, M., Staar, P.: Tableformer: Table structure un-", "orig": "Nassar, A., Livathinos, N., Lysak, M., Staar, P.: Tableformer: Table structure un-", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 25, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 151.5, "r_y0": 292.2, "r_x1": 480.6, "r_y1": 292.2, "r_x2": 480.6, "r_y2": 284.1, "r_x3": 151.5, "r_y3": 284.1, "coord_origin": "TOPLEFT" }, "text": "derstanding with transformers. In: Proceedings of the IEEE/CVF Conference on", "orig": "derstanding with transformers. In: Proceedings of the IEEE/CVF Conference on", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 26, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 151.5, "r_y0": 303.1, "r_x1": 473.4, "r_y1": 303.1, "r_x2": 473.4, "r_y2": 295.1, "r_x3": 151.5, "r_y3": 295.1, "coord_origin": "TOPLEFT" }, "text": "Computer Vision and Pattern Recognition (CVPR). pp. 4614-4623 (June 2022)", "orig": "Computer Vision and Pattern Recognition (CVPR). pp. 4614-4623 (June 2022)", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, "text": "9. Nassar, A., Livathinos, N., Lysak, M., Staar, P.: Tableformer: Table structure understanding with transformers. In: Proceedings of the IEEE/CVF Conference on Computer Vision and Pattern Recognition (CVPR). pp. 4614-4623 (June 2022)" }, { "label": "list_item", "id": 9, "page_no": 12, "cluster": { "id": 9, "label": "list_item", "bbox": { "l": 134.8, "t": 306.0, "r": 480.6, "b": 368.9, "coord_origin": "TOPLEFT" }, "confidence": 0.96, "cells": [ { "index": 27, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 134.8, "r_y0": 314.1, "r_x1": 146.5, "r_y1": 314.1, "r_x2": 146.5, "r_y2": 306.0, "r_x3": 134.8, "r_y3": 306.0, "coord_origin": "TOPLEFT" }, "text": "10.", "orig": "10.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 28, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 151.1, "r_y0": 314.1, "r_x1": 480.6, "r_y1": 314.1, "r_x2": 480.6, "r_y2": 306.0, "r_x3": 151.1, "r_y3": 306.0, "coord_origin": "TOPLEFT" }, "text": "Pfitzmann, B., Auer, C., Dolfi, M., Nassar, A.S., Staar, P.W.J.: Doclaynet: A", "orig": "Pfitzmann, B., Auer, C., Dolfi, M., Nassar, A.S., Staar, P.W.J.: Doclaynet: A", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 29, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 151.5, "r_y0": 325.1, "r_x1": 480.6, "r_y1": 325.1, "r_x2": 480.6, "r_y2": 317.0, "r_x3": 151.5, "r_y3": 317.0, "coord_origin": "TOPLEFT" }, "text": "large human-annotated dataset for document-layout segmentation. In: Zhang, A.,", "orig": "large human-annotated dataset for document-layout segmentation. In: Zhang, A.,", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 30, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 151.5, "r_y0": 336.0, "r_x1": 480.6, "r_y1": 336.0, "r_x2": 480.6, "r_y2": 328.0, "r_x3": 151.5, "r_y3": 328.0, "coord_origin": "TOPLEFT" }, "text": "Rangwala, H. (eds.) KDD \u201922: The 28th ACM SIGKDD Conference on Knowledge", "orig": "Rangwala, H. (eds.) KDD \u201922: The 28th ACM SIGKDD Conference on Knowledge", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 31, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 151.5, "r_y0": 347.0, "r_x1": 480.6, "r_y1": 347.0, "r_x2": 480.6, "r_y2": 338.9, "r_x3": 151.5, "r_y3": 338.9, "coord_origin": "TOPLEFT" }, "text": "Discovery and Data Mining, Washington, DC, USA, August 14 - 18, 2022. pp.", "orig": "Discovery and Data Mining, Washington, DC, USA, August 14 - 18, 2022. pp.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 32, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 151.5, "r_y0": 357.9, "r_x1": 251.1, "r_y1": 357.9, "r_x2": 251.1, "r_y2": 349.9, "r_x3": 151.5, "r_y3": 349.9, "coord_origin": "TOPLEFT" }, "text": "3743-3751. ACM (2022).", "orig": "3743-3751. ACM (2022).", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 33, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 254.0, "r_y0": 358.0, "r_x1": 437.5, "r_y1": 358.0, "r_x2": 437.5, "r_y2": 350.5, "r_x3": 254.0, "r_y3": 350.5, "coord_origin": "TOPLEFT" }, "text": "https://doi.org/10.1145/3534678.3539043", "orig": "https://doi.org/10.1145/3534678.3539043", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 34, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 437.5, "r_y0": 357.9, "r_x1": 440.1, "r_y1": 357.9, "r_x2": 440.1, "r_y2": 349.9, "r_x3": 437.5, "r_y3": 349.9, "coord_origin": "TOPLEFT" }, "text": ",", "orig": ",", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 35, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 442.9, "r_y0": 358.0, "r_x1": 480.6, "r_y1": 358.0, "r_x2": 480.6, "r_y2": 350.5, "r_x3": 442.9, "r_y3": 350.5, "coord_origin": "TOPLEFT" }, "text": "https://", "orig": "https://", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 36, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 151.5, "r_y0": 368.9, "r_x1": 297.4, "r_y1": 368.9, "r_x2": 297.4, "r_y2": 361.5, "r_x3": 151.5, "r_y3": 361.5, "coord_origin": "TOPLEFT" }, "text": "doi.org/10.1145/3534678.3539043", "orig": "doi.org/10.1145/3534678.3539043", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, "text": "10. Pfitzmann, B., Auer, C., Dolfi, M., Nassar, A.S., Staar, P.W.J.: Doclaynet: A large human-annotated dataset for document-layout segmentation. In: Zhang, A., Rangwala, H. (eds.) KDD '22: The 28th ACM SIGKDD Conference on Knowledge Discovery and Data Mining, Washington, DC, USA, August 14 - 18, 2022. pp. 3743-3751. ACM (2022). https://doi.org/10.1145/3534678.3539043 , https:// doi.org/10.1145/3534678.3539043" }, { "label": "list_item", "id": 0, "page_no": 12, "cluster": { "id": 0, "label": "list_item", "bbox": { "l": 134.8, "t": 371.8, "r": 480.6, "b": 412.7, "coord_origin": "TOPLEFT" }, "confidence": 0.98, "cells": [ { "index": 37, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 134.8, "r_y0": 379.9, "r_x1": 146.0, "r_y1": 379.9, "r_x2": 146.0, "r_y2": 371.8, "r_x3": 134.8, "r_y3": 371.8, "coord_origin": "TOPLEFT" }, "text": "11.", "orig": "11.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 38, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 150.5, "r_y0": 379.9, "r_x1": 480.6, "r_y1": 379.9, "r_x2": 480.6, "r_y2": 371.8, "r_x3": 150.5, "r_y3": 371.8, "coord_origin": "TOPLEFT" }, "text": "Prasad, D., Gadpal, A., Kapadni, K., Visave, M., Sultanpure, K.: Cascadetabnet:", "orig": "Prasad, D., Gadpal, A., Kapadni, K., Visave, M., Sultanpure, K.: Cascadetabnet:", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 39, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 151.5, "r_y0": 390.8, "r_x1": 480.6, "r_y1": 390.8, "r_x2": 480.6, "r_y2": 382.8, "r_x3": 151.5, "r_y3": 382.8, "coord_origin": "TOPLEFT" }, "text": "An approach for end to end table detection and structure recognition from image-", "orig": "An approach for end to end table detection and structure recognition from image-", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 40, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 151.5, "r_y0": 401.8, "r_x1": 480.6, "r_y1": 401.8, "r_x2": 480.6, "r_y2": 393.7, "r_x3": 151.5, "r_y3": 393.7, "coord_origin": "TOPLEFT" }, "text": "based documents. In: Proceedings of the IEEE/CVF conference on computer vision", "orig": "based documents. In: Proceedings of the IEEE/CVF conference on computer vision", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 41, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 151.5, "r_y0": 412.7, "r_x1": 373.8, "r_y1": 412.7, "r_x2": 373.8, "r_y2": 404.7, "r_x3": 151.5, "r_y3": 404.7, "coord_origin": "TOPLEFT" }, "text": "and pattern recognition workshops. pp. 572-573 (2020)", "orig": "and pattern recognition workshops. pp. 572-573 (2020)", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, "text": "11. Prasad, D., Gadpal, A., Kapadni, K., Visave, M., Sultanpure, K.: Cascadetabnet: An approach for end to end table detection and structure recognition from imagebased documents. In: Proceedings of the IEEE/CVF conference on computer vision and pattern recognition workshops. pp. 572-573 (2020)" }, { "label": "list_item", "id": 3, "page_no": 12, "cluster": { "id": 3, "label": "list_item", "bbox": { "l": 134.8, "t": 415.6, "r": 480.6, "b": 456.6, "coord_origin": "TOPLEFT" }, "confidence": 0.97, "cells": [ { "index": 42, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 134.8, "r_y0": 423.7, "r_x1": 145.9, "r_y1": 423.7, "r_x2": 145.9, "r_y2": 415.6, "r_x3": 134.8, "r_y3": 415.6, "coord_origin": "TOPLEFT" }, "text": "12.", "orig": "12.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 43, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 150.3, "r_y0": 423.7, "r_x1": 480.6, "r_y1": 423.7, "r_x2": 480.6, "r_y2": 415.6, "r_x3": 150.3, "r_y3": 415.6, "coord_origin": "TOPLEFT" }, "text": "Schreiber, S., Agne, S., Wolf, I., Dengel, A., Ahmed, S.: Deepdesrt: Deep learning", "orig": "Schreiber, S., Agne, S., Wolf, I., Dengel, A., Ahmed, S.: Deepdesrt: Deep learning", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 44, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 151.5, "r_y0": 434.7, "r_x1": 480.6, "r_y1": 434.7, "r_x2": 480.6, "r_y2": 426.6, "r_x3": 151.5, "r_y3": 426.6, "coord_origin": "TOPLEFT" }, "text": "for detection and structure recognition of tables in document images. In: 2017 14th", "orig": "for detection and structure recognition of tables in document images. In: 2017 14th", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 45, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 151.5, "r_y0": 445.6, "r_x1": 480.6, "r_y1": 445.6, "r_x2": 480.6, "r_y2": 437.6, "r_x3": 151.5, "r_y3": 437.6, "coord_origin": "TOPLEFT" }, "text": "IAPR international conference on document analysis and recognition (ICDAR).", "orig": "IAPR international conference on document analysis and recognition (ICDAR).", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 46, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 151.5, "r_y0": 456.6, "r_x1": 292.9, "r_y1": 456.6, "r_x2": 292.9, "r_y2": 448.5, "r_x3": 151.5, "r_y3": 448.5, "coord_origin": "TOPLEFT" }, "text": "vol. 1, pp. 1162-1167. IEEE (2017)", "orig": "vol. 1, pp. 1162-1167. IEEE (2017)", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, "text": "12. Schreiber, S., Agne, S., Wolf, I., Dengel, A., Ahmed, S.: Deepdesrt: Deep learning for detection and structure recognition of tables in document images. In: 2017 14th IAPR international conference on document analysis and recognition (ICDAR). vol. 1, pp. 1162-1167. IEEE (2017)" }, { "label": "list_item", "id": 7, "page_no": 12, "cluster": { "id": 7, "label": "list_item", "bbox": { "l": 134.8, "t": 459.5, "r": 480.6, "b": 500.5, "coord_origin": "TOPLEFT" }, "confidence": 0.97, "cells": [ { "index": 47, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 134.8, "r_y0": 467.6, "r_x1": 145.8, "r_y1": 467.6, "r_x2": 145.8, "r_y2": 459.5, "r_x3": 134.8, "r_y3": 459.5, "coord_origin": "TOPLEFT" }, "text": "13.", "orig": "13.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 48, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 150.1, "r_y0": 467.6, "r_x1": 480.6, "r_y1": 467.6, "r_x2": 480.6, "r_y2": 459.5, "r_x3": 150.1, "r_y3": 459.5, "coord_origin": "TOPLEFT" }, "text": "Siddiqui, S.A., Fateh, I.A., Rizvi, S.T.R., Dengel, A., Ahmed, S.: Deeptabstr: Deep", "orig": "Siddiqui, S.A., Fateh, I.A., Rizvi, S.T.R., Dengel, A., Ahmed, S.: Deeptabstr: Deep", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 49, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 151.5, "r_y0": 478.5, "r_x1": 480.6, "r_y1": 478.5, "r_x2": 480.6, "r_y2": 470.5, "r_x3": 151.5, "r_y3": 470.5, "coord_origin": "TOPLEFT" }, "text": "learning based table structure recognition. In: 2019 International Conference on", "orig": "learning based table structure recognition. In: 2019 International Conference on", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 50, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 151.5, "r_y0": 489.5, "r_x1": 439.1, "r_y1": 489.5, "r_x2": 439.1, "r_y2": 481.4, "r_x3": 151.5, "r_y3": 481.4, "coord_origin": "TOPLEFT" }, "text": "Document Analysis and Recognition (ICDAR). pp. 1403-1409 (2019).", "orig": "Document Analysis and Recognition (ICDAR). pp. 1403-1409 (2019).", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 51, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 442.9, "r_y0": 489.5, "r_x1": 480.6, "r_y1": 489.5, "r_x2": 480.6, "r_y2": 482.1, "r_x3": 442.9, "r_y3": 482.1, "coord_origin": "TOPLEFT" }, "text": "https://", "orig": "https://", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 52, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 151.5, "r_y0": 500.5, "r_x1": 302.1, "r_y1": 500.5, "r_x2": 302.1, "r_y2": 493.0, "r_x3": 151.5, "r_y3": 493.0, "coord_origin": "TOPLEFT" }, "text": "doi.org/10.1109/ICDAR.2019.00226", "orig": "doi.org/10.1109/ICDAR.2019.00226", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, "text": "13. Siddiqui, S.A., Fateh, I.A., Rizvi, S.T.R., Dengel, A., Ahmed, S.: Deeptabstr: Deep learning based table structure recognition. In: 2019 International Conference on Document Analysis and Recognition (ICDAR). pp. 1403-1409 (2019). https:// doi.org/10.1109/ICDAR.2019.00226" }, { "label": "list_item", "id": 2, "page_no": 12, "cluster": { "id": 2, "label": "list_item", "bbox": { "l": 134.8, "t": 503.3, "r": 480.6, "b": 544.3, "coord_origin": "TOPLEFT" }, "confidence": 0.97, "cells": [ { "index": 53, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 134.8, "r_y0": 511.4, "r_x1": 146.2, "r_y1": 511.4, "r_x2": 146.2, "r_y2": 503.3, "r_x3": 134.8, "r_y3": 503.3, "coord_origin": "TOPLEFT" }, "text": "14.", "orig": "14.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 54, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 150.6, "r_y0": 511.4, "r_x1": 480.6, "r_y1": 511.4, "r_x2": 480.6, "r_y2": 503.3, "r_x3": 150.6, "r_y3": 503.3, "coord_origin": "TOPLEFT" }, "text": "Smock, B., Pesala, R., Abraham, R.: PubTables-1M: Towards comprehensive ta-", "orig": "Smock, B., Pesala, R., Abraham, R.: PubTables-1M: Towards comprehensive ta-", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 55, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 151.5, "r_y0": 522.4, "r_x1": 480.6, "r_y1": 522.4, "r_x2": 480.6, "r_y2": 514.3, "r_x3": 151.5, "r_y3": 514.3, "coord_origin": "TOPLEFT" }, "text": "ble extraction from unstructured documents. In: Proceedings of the IEEE/CVF", "orig": "ble extraction from unstructured documents. In: Proceedings of the IEEE/CVF", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 56, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 151.5, "r_y0": 533.3, "r_x1": 480.6, "r_y1": 533.3, "r_x2": 480.6, "r_y2": 525.3, "r_x3": 151.5, "r_y3": 525.3, "coord_origin": "TOPLEFT" }, "text": "Conference on Computer Vision and Pattern Recognition (CVPR). pp. 4634-4642", "orig": "Conference on Computer Vision and Pattern Recognition (CVPR). pp. 4634-4642", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 57, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 151.5, "r_y0": 544.3, "r_x1": 199.2, "r_y1": 544.3, "r_x2": 199.2, "r_y2": 536.2, "r_x3": 151.5, "r_y3": 536.2, "coord_origin": "TOPLEFT" }, "text": "(June 2022)", "orig": "(June 2022)", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, "text": "14. Smock, B., Pesala, R., Abraham, R.: PubTables-1M: Towards comprehensive table extraction from unstructured documents. In: Proceedings of the IEEE/CVF Conference on Computer Vision and Pattern Recognition (CVPR). pp. 4634-4642 (June 2022)" }, { "label": "list_item", "id": 6, "page_no": 12, "cluster": { "id": 6, "label": "list_item", "bbox": { "l": 134.8, "t": 547.2, "r": 480.6, "b": 610.1, "coord_origin": "TOPLEFT" }, "confidence": 0.97, "cells": [ { "index": 58, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 134.8, "r_y0": 555.3, "r_x1": 146.2, "r_y1": 555.3, "r_x2": 146.2, "r_y2": 547.2, "r_x3": 134.8, "r_y3": 547.2, "coord_origin": "TOPLEFT" }, "text": "15.", "orig": "15.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 59, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 150.6, "r_y0": 555.3, "r_x1": 480.6, "r_y1": 555.3, "r_x2": 480.6, "r_y2": 547.2, "r_x3": 150.6, "r_y3": 547.2, "coord_origin": "TOPLEFT" }, "text": "Staar, P.W.J., Dolfi, M., Auer, C., Bekas, C.: Corpus conversion service: A ma-", "orig": "Staar, P.W.J., Dolfi, M., Auer, C., Bekas, C.: Corpus conversion service: A ma-", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 60, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 151.5, "r_y0": 566.2, "r_x1": 480.6, "r_y1": 566.2, "r_x2": 480.6, "r_y2": 558.1, "r_x3": 151.5, "r_y3": 558.1, "coord_origin": "TOPLEFT" }, "text": "chine learning platform to ingest documents at scale. In: Proceedings of the 24th", "orig": "chine learning platform to ingest documents at scale. In: Proceedings of the 24th", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 61, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 151.5, "r_y0": 577.2, "r_x1": 480.6, "r_y1": 577.2, "r_x2": 480.6, "r_y2": 569.1, "r_x3": 151.5, "r_y3": 569.1, "coord_origin": "TOPLEFT" }, "text": "ACM SIGKDD International Conference on Knowledge Discovery & Data Min-", "orig": "ACM SIGKDD International Conference on Knowledge Discovery & Data Min-", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 62, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 151.5, "r_y0": 588.1, "r_x1": 480.6, "r_y1": 588.1, "r_x2": 480.6, "r_y2": 580.1, "r_x3": 151.5, "r_y3": 580.1, "coord_origin": "TOPLEFT" }, "text": "ing. pp. 774-782. KDD \u201918, Association for Computing Machinery, New York, NY,", "orig": "ing. pp. 774-782. KDD \u201918, Association for Computing Machinery, New York, NY,", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 63, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 151.5, "r_y0": 599.1, "r_x1": 200.8, "r_y1": 599.1, "r_x2": 200.8, "r_y2": 591.0, "r_x3": 151.5, "r_y3": 591.0, "coord_origin": "TOPLEFT" }, "text": "USA (2018).", "orig": "USA (2018).", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 64, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 202.9, "r_y0": 599.1, "r_x1": 386.5, "r_y1": 599.1, "r_x2": 386.5, "r_y2": 591.7, "r_x3": 202.9, "r_y3": 591.7, "coord_origin": "TOPLEFT" }, "text": "https://doi.org/10.1145/3219819.3219834", "orig": "https://doi.org/10.1145/3219819.3219834", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 65, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 386.5, "r_y0": 599.1, "r_x1": 389.0, "r_y1": 599.1, "r_x2": 389.0, "r_y2": 591.0, "r_x3": 386.5, "r_y3": 591.0, "coord_origin": "TOPLEFT" }, "text": ",", "orig": ",", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 66, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 391.2, "r_y0": 599.1, "r_x1": 480.6, "r_y1": 599.1, "r_x2": 480.6, "r_y2": 591.7, "r_x3": 391.2, "r_y3": 591.7, "coord_origin": "TOPLEFT" }, "text": "https://doi.org/10.", "orig": "https://doi.org/10.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 67, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 151.5, "r_y0": 610.1, "r_x1": 245.6, "r_y1": 610.1, "r_x2": 245.6, "r_y2": 602.6, "r_x3": 151.5, "r_y3": 602.6, "coord_origin": "TOPLEFT" }, "text": "1145/3219819.3219834", "orig": "1145/3219819.3219834", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, "text": "15. Staar, P.W.J., Dolfi, M., Auer, C., Bekas, C.: Corpus conversion service: A machine learning platform to ingest documents at scale. In: Proceedings of the 24th ACM SIGKDD International Conference on Knowledge Discovery & Data Mining. pp. 774-782. KDD '18, Association for Computing Machinery, New York, NY, USA (2018). https://doi.org/10.1145/3219819.3219834 , https://doi.org/10. 1145/3219819.3219834" }, { "label": "list_item", "id": 12, "page_no": 12, "cluster": { "id": 12, "label": "list_item", "bbox": { "l": 134.8, "t": 613.0, "r": 480.6, "b": 632.0, "coord_origin": "TOPLEFT" }, "confidence": 0.94, "cells": [ { "index": 68, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 134.8, "r_y0": 621.0, "r_x1": 146.6, "r_y1": 621.0, "r_x2": 146.6, "r_y2": 613.0, "r_x3": 134.8, "r_y3": 613.0, "coord_origin": "TOPLEFT" }, "text": "16.", "orig": "16.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 69, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 151.3, "r_y0": 621.0, "r_x1": 480.6, "r_y1": 621.0, "r_x2": 480.6, "r_y2": 613.0, "r_x3": 151.3, "r_y3": 613.0, "coord_origin": "TOPLEFT" }, "text": "Wang, X.: Tabular Abstraction, Editing, and Formatting. Ph.D. thesis, CAN", "orig": "Wang, X.: Tabular Abstraction, Editing, and Formatting. Ph.D. thesis, CAN", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 70, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 151.5, "r_y0": 632.0, "r_x1": 234.4, "r_y1": 632.0, "r_x2": 234.4, "r_y2": 623.9, "r_x3": 151.5, "r_y3": 623.9, "coord_origin": "TOPLEFT" }, "text": "(1996), aAINN09397", "orig": "(1996), aAINN09397", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, "text": "16. Wang, X.: Tabular Abstraction, Editing, and Formatting. Ph.D. thesis, CAN (1996), aAINN09397" }, { "label": "list_item", "id": 8, "page_no": 12, "cluster": { "id": 8, "label": "list_item", "bbox": { "l": 134.8, "t": 634.9, "r": 480.6, "b": 664.9, "coord_origin": "TOPLEFT" }, "confidence": 0.96, "cells": [ { "index": 71, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 134.8, "r_y0": 642.9, "r_x1": 146.3, "r_y1": 642.9, "r_x2": 146.3, "r_y2": 634.9, "r_x3": 134.8, "r_y3": 634.9, "coord_origin": "TOPLEFT" }, "text": "17.", "orig": "17.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 72, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 150.8, "r_y0": 642.9, "r_x1": 480.6, "r_y1": 642.9, "r_x2": 480.6, "r_y2": 634.9, "r_x3": 150.8, "r_y3": 634.9, "coord_origin": "TOPLEFT" }, "text": "Xue, W., Li, Q., Tao, D.: Res2tim: Reconstruct syntactic structures from table", "orig": "Xue, W., Li, Q., Tao, D.: Res2tim: Reconstruct syntactic structures from table", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 73, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 151.5, "r_y0": 653.9, "r_x1": 480.6, "r_y1": 653.9, "r_x2": 480.6, "r_y2": 645.8, "r_x3": 151.5, "r_y3": 645.8, "coord_origin": "TOPLEFT" }, "text": "images. In: 2019 International Conference on Document Analysis and Recognition", "orig": "images. In: 2019 International Conference on Document Analysis and Recognition", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 74, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 151.5, "r_y0": 664.9, "r_x1": 299.3, "r_y1": 664.9, "r_x2": 299.3, "r_y2": 656.8, "r_x3": 151.5, "r_y3": 656.8, "coord_origin": "TOPLEFT" }, "text": "(ICDAR). pp. 749-755. IEEE (2019)", "orig": "(ICDAR). pp. 749-755. IEEE (2019)", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, "text": "17. Xue, W., Li, Q., Tao, D.: Res2tim: Reconstruct syntactic structures from table images. In: 2019 International Conference on Document Analysis and Recognition (ICDAR). pp. 749-755. IEEE (2019)" } ], "body": [ { "label": "list_item", "id": 5, "page_no": 12, "cluster": { "id": 5, "label": "list_item", "bbox": { "l": 139.4, "t": 119.7, "r": 480.6, "b": 149.7, "coord_origin": "TOPLEFT" }, "confidence": 0.97, "cells": [ { "index": 2, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 139.4, "r_y0": 127.7, "r_x1": 146.0, "r_y1": 127.7, "r_x2": 146.0, "r_y2": 119.7, "r_x3": 139.4, "r_y3": 119.7, "coord_origin": "TOPLEFT" }, "text": "5.", "orig": "5.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 3, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 150.3, "r_y0": 127.7, "r_x1": 480.6, "r_y1": 127.7, "r_x2": 480.6, "r_y2": 119.7, "r_x3": 150.3, "r_y3": 119.7, "coord_origin": "TOPLEFT" }, "text": "Kayal, P., Anand, M., Desai, H., Singh, M.: Tables to latex: structure and content", "orig": "Kayal, P., Anand, M., Desai, H., Singh, M.: Tables to latex: structure and content", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 4, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 151.5, "r_y0": 138.7, "r_x1": 480.6, "r_y1": 138.7, "r_x2": 480.6, "r_y2": 130.6, "r_x3": 151.5, "r_y3": 130.6, "coord_origin": "TOPLEFT" }, "text": "extraction from scientific tables. International Journal on Document Analysis and", "orig": "extraction from scientific tables. International Journal on Document Analysis and", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 5, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 151.5, "r_y0": 149.7, "r_x1": 304.0, "r_y1": 149.7, "r_x2": 304.0, "r_y2": 141.6, "r_x3": 151.5, "r_y3": 141.6, "coord_origin": "TOPLEFT" }, "text": "Recognition (IJDAR) pp. 1-10 (2022)", "orig": "Recognition (IJDAR) pp. 1-10 (2022)", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, "text": "5. Kayal, P., Anand, M., Desai, H., Singh, M.: Tables to latex: structure and content extraction from scientific tables. International Journal on Document Analysis and Recognition (IJDAR) pp. 1-10 (2022)" }, { "label": "list_item", "id": 1, "page_no": 12, "cluster": { "id": 1, "label": "list_item", "bbox": { "l": 139.4, "t": 152.6, "r": 480.6, "b": 193.5, "coord_origin": "TOPLEFT" }, "confidence": 0.97, "cells": [ { "index": 6, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 139.4, "r_y0": 160.6, "r_x1": 145.9, "r_y1": 160.6, "r_x2": 145.9, "r_y2": 152.6, "r_x3": 139.4, "r_y3": 152.6, "coord_origin": "TOPLEFT" }, "text": "6.", "orig": "6.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 7, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 150.2, "r_y0": 160.6, "r_x1": 480.6, "r_y1": 160.6, "r_x2": 480.6, "r_y2": 152.6, "r_x3": 150.2, "r_y3": 152.6, "coord_origin": "TOPLEFT" }, "text": "Lee, E., Kwon, J., Yang, H., Park, J., Lee, S., Koo, H.I., Cho, N.I.: Table structure", "orig": "Lee, E., Kwon, J., Yang, H., Park, J., Lee, S., Koo, H.I., Cho, N.I.: Table structure", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 8, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 151.5, "r_y0": 171.6, "r_x1": 480.6, "r_y1": 171.6, "r_x2": 480.6, "r_y2": 163.5, "r_x3": 151.5, "r_y3": 163.5, "coord_origin": "TOPLEFT" }, "text": "recognition based on grid shape graph. In: 2022 Asia-Pacific Signal and Information", "orig": "recognition based on grid shape graph. In: 2022 Asia-Pacific Signal and Information", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 9, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 151.5, "r_y0": 182.5, "r_x1": 480.6, "r_y1": 182.5, "r_x2": 480.6, "r_y2": 174.5, "r_x3": 151.5, "r_y3": 174.5, "coord_origin": "TOPLEFT" }, "text": "Processing Association Annual Summit and Conference (APSIPA ASC). pp. 1868-", "orig": "Processing Association Annual Summit and Conference (APSIPA ASC). pp. 1868-", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 10, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 151.5, "r_y0": 193.5, "r_x1": 226.4, "r_y1": 193.5, "r_x2": 226.4, "r_y2": 185.4, "r_x3": 151.5, "r_y3": 185.4, "coord_origin": "TOPLEFT" }, "text": "1873. IEEE (2022)", "orig": "1873. IEEE (2022)", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, "text": "6. Lee, E., Kwon, J., Yang, H., Park, J., Lee, S., Koo, H.I., Cho, N.I.: Table structure recognition based on grid shape graph. In: 2022 Asia-Pacific Signal and Information Processing Association Annual Summit and Conference (APSIPA ASC). pp. 18681873. IEEE (2022)" }, { "label": "list_item", "id": 10, "page_no": 12, "cluster": { "id": 10, "label": "list_item", "bbox": { "l": 139.4, "t": 196.4, "r": 480.6, "b": 215.4, "coord_origin": "TOPLEFT" }, "confidence": 0.96, "cells": [ { "index": 11, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 139.4, "r_y0": 204.5, "r_x1": 146.3, "r_y1": 204.5, "r_x2": 146.3, "r_y2": 196.4, "r_x3": 139.4, "r_y3": 196.4, "coord_origin": "TOPLEFT" }, "text": "7.", "orig": "7.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 12, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 150.8, "r_y0": 204.5, "r_x1": 480.6, "r_y1": 204.5, "r_x2": 480.6, "r_y2": 196.4, "r_x3": 150.8, "r_y3": 196.4, "coord_origin": "TOPLEFT" }, "text": "Li, M., Cui, L., Huang, S., Wei, F., Zhou, M., Li, Z.: Tablebank: A benchmark", "orig": "Li, M., Cui, L., Huang, S., Wei, F., Zhou, M., Li, Z.: Tablebank: A benchmark", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 13, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 151.5, "r_y0": 215.4, "r_x1": 352.0, "r_y1": 215.4, "r_x2": 352.0, "r_y2": 207.4, "r_x3": 151.5, "r_y3": 207.4, "coord_origin": "TOPLEFT" }, "text": "dataset for table detection and recognition (2019)", "orig": "dataset for table detection and recognition (2019)", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, "text": "7. Li, M., Cui, L., Huang, S., Wei, F., Zhou, M., Li, Z.: Tablebank: A benchmark dataset for table detection and recognition (2019)" }, { "label": "list_item", "id": 4, "page_no": 12, "cluster": { "id": 4, "label": "list_item", "bbox": { "l": 139.4, "t": 218.3, "r": 480.6, "b": 270.3, "coord_origin": "TOPLEFT" }, "confidence": 0.97, "cells": [ { "index": 14, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 139.4, "r_y0": 226.4, "r_x1": 146.4, "r_y1": 226.4, "r_x2": 146.4, "r_y2": 218.3, "r_x3": 139.4, "r_y3": 218.3, "coord_origin": "TOPLEFT" }, "text": "8.", "orig": "8.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 15, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 150.9, "r_y0": 226.4, "r_x1": 480.6, "r_y1": 226.4, "r_x2": 480.6, "r_y2": 218.3, "r_x3": 150.9, "r_y3": 218.3, "coord_origin": "TOPLEFT" }, "text": "Livathinos, N., Berrospi, C., Lysak, M., Kuropiatnyk, V., Nassar, A., Carvalho,", "orig": "Livathinos, N., Berrospi, C., Lysak, M., Kuropiatnyk, V., Nassar, A., Carvalho,", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 16, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 151.5, "r_y0": 237.4, "r_x1": 480.6, "r_y1": 237.4, "r_x2": 480.6, "r_y2": 229.3, "r_x3": 151.5, "r_y3": 229.3, "coord_origin": "TOPLEFT" }, "text": "A., Dolfi, M., Auer, C., Dinkla, K., Staar, P.: Robust pdf document conversion", "orig": "A., Dolfi, M., Auer, C., Dinkla, K., Staar, P.: Robust pdf document conversion", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 17, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 151.5, "r_y0": 248.3, "r_x1": 480.6, "r_y1": 248.3, "r_x2": 480.6, "r_y2": 240.3, "r_x3": 151.5, "r_y3": 240.3, "coord_origin": "TOPLEFT" }, "text": "using recurrent neural networks. Proceedings of the AAAI Conference on Artificial", "orig": "using recurrent neural networks. Proceedings of the AAAI Conference on Artificial", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 18, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 151.5, "r_y0": 259.3, "r_x1": 197.1, "r_y1": 259.3, "r_x2": 197.1, "r_y2": 251.2, "r_x3": 151.5, "r_y3": 251.2, "coord_origin": "TOPLEFT" }, "text": "Intelligence", "orig": "Intelligence", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 19, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 199.4, "r_y0": 259.1, "r_x1": 210.0, "r_y1": 259.1, "r_x2": 210.0, "r_y2": 251.2, "r_x3": 199.4, "r_y3": 251.2, "coord_origin": "TOPLEFT" }, "text": "35", "orig": "35", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 20, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 210.0, "r_y0": 259.3, "r_x1": 332.4, "r_y1": 259.3, "r_x2": 332.4, "r_y2": 251.2, "r_x3": 210.0, "r_y3": 251.2, "coord_origin": "TOPLEFT" }, "text": "(17), 15137-15145 (May 2021),", "orig": "(17), 15137-15145 (May 2021),", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 21, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 334.7, "r_y0": 259.3, "r_x1": 480.6, "r_y1": 259.3, "r_x2": 480.6, "r_y2": 251.9, "r_x3": 334.7, "r_y3": 251.9, "coord_origin": "TOPLEFT" }, "text": "https://ojs.aaai.org/index.php/", "orig": "https://ojs.aaai.org/index.php/", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 22, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 151.5, "r_y0": 270.3, "r_x1": 259.8, "r_y1": 270.3, "r_x2": 259.8, "r_y2": 262.8, "r_x3": 151.5, "r_y3": 262.8, "coord_origin": "TOPLEFT" }, "text": "AAAI/article/view/17777", "orig": "AAAI/article/view/17777", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, "text": "8. Livathinos, N., Berrospi, C., Lysak, M., Kuropiatnyk, V., Nassar, A., Carvalho, A., Dolfi, M., Auer, C., Dinkla, K., Staar, P.: Robust pdf document conversion using recurrent neural networks. Proceedings of the AAAI Conference on Artificial Intelligence 35 (17), 15137-15145 (May 2021), https://ojs.aaai.org/index.php/ AAAI/article/view/17777" }, { "label": "list_item", "id": 11, "page_no": 12, "cluster": { "id": 11, "label": "list_item", "bbox": { "l": 139.4, "t": 273.1, "r": 480.6, "b": 303.1, "coord_origin": "TOPLEFT" }, "confidence": 0.96, "cells": [ { "index": 23, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 139.4, "r_y0": 281.2, "r_x1": 146.1, "r_y1": 281.2, "r_x2": 146.1, "r_y2": 273.1, "r_x3": 139.4, "r_y3": 273.1, "coord_origin": "TOPLEFT" }, "text": "9.", "orig": "9.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 24, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 150.5, "r_y0": 281.2, "r_x1": 480.6, "r_y1": 281.2, "r_x2": 480.6, "r_y2": 273.1, "r_x3": 150.5, "r_y3": 273.1, "coord_origin": "TOPLEFT" }, "text": "Nassar, A., Livathinos, N., Lysak, M., Staar, P.: Tableformer: Table structure un-", "orig": "Nassar, A., Livathinos, N., Lysak, M., Staar, P.: Tableformer: Table structure un-", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 25, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 151.5, "r_y0": 292.2, "r_x1": 480.6, "r_y1": 292.2, "r_x2": 480.6, "r_y2": 284.1, "r_x3": 151.5, "r_y3": 284.1, "coord_origin": "TOPLEFT" }, "text": "derstanding with transformers. In: Proceedings of the IEEE/CVF Conference on", "orig": "derstanding with transformers. In: Proceedings of the IEEE/CVF Conference on", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 26, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 151.5, "r_y0": 303.1, "r_x1": 473.4, "r_y1": 303.1, "r_x2": 473.4, "r_y2": 295.1, "r_x3": 151.5, "r_y3": 295.1, "coord_origin": "TOPLEFT" }, "text": "Computer Vision and Pattern Recognition (CVPR). pp. 4614-4623 (June 2022)", "orig": "Computer Vision and Pattern Recognition (CVPR). pp. 4614-4623 (June 2022)", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, "text": "9. Nassar, A., Livathinos, N., Lysak, M., Staar, P.: Tableformer: Table structure understanding with transformers. In: Proceedings of the IEEE/CVF Conference on Computer Vision and Pattern Recognition (CVPR). pp. 4614-4623 (June 2022)" }, { "label": "list_item", "id": 9, "page_no": 12, "cluster": { "id": 9, "label": "list_item", "bbox": { "l": 134.8, "t": 306.0, "r": 480.6, "b": 368.9, "coord_origin": "TOPLEFT" }, "confidence": 0.96, "cells": [ { "index": 27, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 134.8, "r_y0": 314.1, "r_x1": 146.5, "r_y1": 314.1, "r_x2": 146.5, "r_y2": 306.0, "r_x3": 134.8, "r_y3": 306.0, "coord_origin": "TOPLEFT" }, "text": "10.", "orig": "10.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 28, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 151.1, "r_y0": 314.1, "r_x1": 480.6, "r_y1": 314.1, "r_x2": 480.6, "r_y2": 306.0, "r_x3": 151.1, "r_y3": 306.0, "coord_origin": "TOPLEFT" }, "text": "Pfitzmann, B., Auer, C., Dolfi, M., Nassar, A.S., Staar, P.W.J.: Doclaynet: A", "orig": "Pfitzmann, B., Auer, C., Dolfi, M., Nassar, A.S., Staar, P.W.J.: Doclaynet: A", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 29, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 151.5, "r_y0": 325.1, "r_x1": 480.6, "r_y1": 325.1, "r_x2": 480.6, "r_y2": 317.0, "r_x3": 151.5, "r_y3": 317.0, "coord_origin": "TOPLEFT" }, "text": "large human-annotated dataset for document-layout segmentation. In: Zhang, A.,", "orig": "large human-annotated dataset for document-layout segmentation. In: Zhang, A.,", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 30, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 151.5, "r_y0": 336.0, "r_x1": 480.6, "r_y1": 336.0, "r_x2": 480.6, "r_y2": 328.0, "r_x3": 151.5, "r_y3": 328.0, "coord_origin": "TOPLEFT" }, "text": "Rangwala, H. (eds.) KDD \u201922: The 28th ACM SIGKDD Conference on Knowledge", "orig": "Rangwala, H. (eds.) KDD \u201922: The 28th ACM SIGKDD Conference on Knowledge", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 31, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 151.5, "r_y0": 347.0, "r_x1": 480.6, "r_y1": 347.0, "r_x2": 480.6, "r_y2": 338.9, "r_x3": 151.5, "r_y3": 338.9, "coord_origin": "TOPLEFT" }, "text": "Discovery and Data Mining, Washington, DC, USA, August 14 - 18, 2022. pp.", "orig": "Discovery and Data Mining, Washington, DC, USA, August 14 - 18, 2022. pp.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 32, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 151.5, "r_y0": 357.9, "r_x1": 251.1, "r_y1": 357.9, "r_x2": 251.1, "r_y2": 349.9, "r_x3": 151.5, "r_y3": 349.9, "coord_origin": "TOPLEFT" }, "text": "3743-3751. ACM (2022).", "orig": "3743-3751. ACM (2022).", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 33, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 254.0, "r_y0": 358.0, "r_x1": 437.5, "r_y1": 358.0, "r_x2": 437.5, "r_y2": 350.5, "r_x3": 254.0, "r_y3": 350.5, "coord_origin": "TOPLEFT" }, "text": "https://doi.org/10.1145/3534678.3539043", "orig": "https://doi.org/10.1145/3534678.3539043", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 34, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 437.5, "r_y0": 357.9, "r_x1": 440.1, "r_y1": 357.9, "r_x2": 440.1, "r_y2": 349.9, "r_x3": 437.5, "r_y3": 349.9, "coord_origin": "TOPLEFT" }, "text": ",", "orig": ",", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 35, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 442.9, "r_y0": 358.0, "r_x1": 480.6, "r_y1": 358.0, "r_x2": 480.6, "r_y2": 350.5, "r_x3": 442.9, "r_y3": 350.5, "coord_origin": "TOPLEFT" }, "text": "https://", "orig": "https://", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 36, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 151.5, "r_y0": 368.9, "r_x1": 297.4, "r_y1": 368.9, "r_x2": 297.4, "r_y2": 361.5, "r_x3": 151.5, "r_y3": 361.5, "coord_origin": "TOPLEFT" }, "text": "doi.org/10.1145/3534678.3539043", "orig": "doi.org/10.1145/3534678.3539043", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, "text": "10. Pfitzmann, B., Auer, C., Dolfi, M., Nassar, A.S., Staar, P.W.J.: Doclaynet: A large human-annotated dataset for document-layout segmentation. In: Zhang, A., Rangwala, H. (eds.) KDD '22: The 28th ACM SIGKDD Conference on Knowledge Discovery and Data Mining, Washington, DC, USA, August 14 - 18, 2022. pp. 3743-3751. ACM (2022). https://doi.org/10.1145/3534678.3539043 , https:// doi.org/10.1145/3534678.3539043" }, { "label": "list_item", "id": 0, "page_no": 12, "cluster": { "id": 0, "label": "list_item", "bbox": { "l": 134.8, "t": 371.8, "r": 480.6, "b": 412.7, "coord_origin": "TOPLEFT" }, "confidence": 0.98, "cells": [ { "index": 37, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 134.8, "r_y0": 379.9, "r_x1": 146.0, "r_y1": 379.9, "r_x2": 146.0, "r_y2": 371.8, "r_x3": 134.8, "r_y3": 371.8, "coord_origin": "TOPLEFT" }, "text": "11.", "orig": "11.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 38, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 150.5, "r_y0": 379.9, "r_x1": 480.6, "r_y1": 379.9, "r_x2": 480.6, "r_y2": 371.8, "r_x3": 150.5, "r_y3": 371.8, "coord_origin": "TOPLEFT" }, "text": "Prasad, D., Gadpal, A., Kapadni, K., Visave, M., Sultanpure, K.: Cascadetabnet:", "orig": "Prasad, D., Gadpal, A., Kapadni, K., Visave, M., Sultanpure, K.: Cascadetabnet:", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 39, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 151.5, "r_y0": 390.8, "r_x1": 480.6, "r_y1": 390.8, "r_x2": 480.6, "r_y2": 382.8, "r_x3": 151.5, "r_y3": 382.8, "coord_origin": "TOPLEFT" }, "text": "An approach for end to end table detection and structure recognition from image-", "orig": "An approach for end to end table detection and structure recognition from image-", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 40, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 151.5, "r_y0": 401.8, "r_x1": 480.6, "r_y1": 401.8, "r_x2": 480.6, "r_y2": 393.7, "r_x3": 151.5, "r_y3": 393.7, "coord_origin": "TOPLEFT" }, "text": "based documents. In: Proceedings of the IEEE/CVF conference on computer vision", "orig": "based documents. In: Proceedings of the IEEE/CVF conference on computer vision", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 41, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 151.5, "r_y0": 412.7, "r_x1": 373.8, "r_y1": 412.7, "r_x2": 373.8, "r_y2": 404.7, "r_x3": 151.5, "r_y3": 404.7, "coord_origin": "TOPLEFT" }, "text": "and pattern recognition workshops. pp. 572-573 (2020)", "orig": "and pattern recognition workshops. pp. 572-573 (2020)", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, "text": "11. Prasad, D., Gadpal, A., Kapadni, K., Visave, M., Sultanpure, K.: Cascadetabnet: An approach for end to end table detection and structure recognition from imagebased documents. In: Proceedings of the IEEE/CVF conference on computer vision and pattern recognition workshops. pp. 572-573 (2020)" }, { "label": "list_item", "id": 3, "page_no": 12, "cluster": { "id": 3, "label": "list_item", "bbox": { "l": 134.8, "t": 415.6, "r": 480.6, "b": 456.6, "coord_origin": "TOPLEFT" }, "confidence": 0.97, "cells": [ { "index": 42, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 134.8, "r_y0": 423.7, "r_x1": 145.9, "r_y1": 423.7, "r_x2": 145.9, "r_y2": 415.6, "r_x3": 134.8, "r_y3": 415.6, "coord_origin": "TOPLEFT" }, "text": "12.", "orig": "12.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 43, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 150.3, "r_y0": 423.7, "r_x1": 480.6, "r_y1": 423.7, "r_x2": 480.6, "r_y2": 415.6, "r_x3": 150.3, "r_y3": 415.6, "coord_origin": "TOPLEFT" }, "text": "Schreiber, S., Agne, S., Wolf, I., Dengel, A., Ahmed, S.: Deepdesrt: Deep learning", "orig": "Schreiber, S., Agne, S., Wolf, I., Dengel, A., Ahmed, S.: Deepdesrt: Deep learning", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 44, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 151.5, "r_y0": 434.7, "r_x1": 480.6, "r_y1": 434.7, "r_x2": 480.6, "r_y2": 426.6, "r_x3": 151.5, "r_y3": 426.6, "coord_origin": "TOPLEFT" }, "text": "for detection and structure recognition of tables in document images. In: 2017 14th", "orig": "for detection and structure recognition of tables in document images. In: 2017 14th", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 45, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 151.5, "r_y0": 445.6, "r_x1": 480.6, "r_y1": 445.6, "r_x2": 480.6, "r_y2": 437.6, "r_x3": 151.5, "r_y3": 437.6, "coord_origin": "TOPLEFT" }, "text": "IAPR international conference on document analysis and recognition (ICDAR).", "orig": "IAPR international conference on document analysis and recognition (ICDAR).", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 46, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 151.5, "r_y0": 456.6, "r_x1": 292.9, "r_y1": 456.6, "r_x2": 292.9, "r_y2": 448.5, "r_x3": 151.5, "r_y3": 448.5, "coord_origin": "TOPLEFT" }, "text": "vol. 1, pp. 1162-1167. IEEE (2017)", "orig": "vol. 1, pp. 1162-1167. IEEE (2017)", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, "text": "12. Schreiber, S., Agne, S., Wolf, I., Dengel, A., Ahmed, S.: Deepdesrt: Deep learning for detection and structure recognition of tables in document images. In: 2017 14th IAPR international conference on document analysis and recognition (ICDAR). vol. 1, pp. 1162-1167. IEEE (2017)" }, { "label": "list_item", "id": 7, "page_no": 12, "cluster": { "id": 7, "label": "list_item", "bbox": { "l": 134.8, "t": 459.5, "r": 480.6, "b": 500.5, "coord_origin": "TOPLEFT" }, "confidence": 0.97, "cells": [ { "index": 47, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 134.8, "r_y0": 467.6, "r_x1": 145.8, "r_y1": 467.6, "r_x2": 145.8, "r_y2": 459.5, "r_x3": 134.8, "r_y3": 459.5, "coord_origin": "TOPLEFT" }, "text": "13.", "orig": "13.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 48, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 150.1, "r_y0": 467.6, "r_x1": 480.6, "r_y1": 467.6, "r_x2": 480.6, "r_y2": 459.5, "r_x3": 150.1, "r_y3": 459.5, "coord_origin": "TOPLEFT" }, "text": "Siddiqui, S.A., Fateh, I.A., Rizvi, S.T.R., Dengel, A., Ahmed, S.: Deeptabstr: Deep", "orig": "Siddiqui, S.A., Fateh, I.A., Rizvi, S.T.R., Dengel, A., Ahmed, S.: Deeptabstr: Deep", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 49, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 151.5, "r_y0": 478.5, "r_x1": 480.6, "r_y1": 478.5, "r_x2": 480.6, "r_y2": 470.5, "r_x3": 151.5, "r_y3": 470.5, "coord_origin": "TOPLEFT" }, "text": "learning based table structure recognition. In: 2019 International Conference on", "orig": "learning based table structure recognition. In: 2019 International Conference on", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 50, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 151.5, "r_y0": 489.5, "r_x1": 439.1, "r_y1": 489.5, "r_x2": 439.1, "r_y2": 481.4, "r_x3": 151.5, "r_y3": 481.4, "coord_origin": "TOPLEFT" }, "text": "Document Analysis and Recognition (ICDAR). pp. 1403-1409 (2019).", "orig": "Document Analysis and Recognition (ICDAR). pp. 1403-1409 (2019).", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 51, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 442.9, "r_y0": 489.5, "r_x1": 480.6, "r_y1": 489.5, "r_x2": 480.6, "r_y2": 482.1, "r_x3": 442.9, "r_y3": 482.1, "coord_origin": "TOPLEFT" }, "text": "https://", "orig": "https://", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 52, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 151.5, "r_y0": 500.5, "r_x1": 302.1, "r_y1": 500.5, "r_x2": 302.1, "r_y2": 493.0, "r_x3": 151.5, "r_y3": 493.0, "coord_origin": "TOPLEFT" }, "text": "doi.org/10.1109/ICDAR.2019.00226", "orig": "doi.org/10.1109/ICDAR.2019.00226", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, "text": "13. Siddiqui, S.A., Fateh, I.A., Rizvi, S.T.R., Dengel, A., Ahmed, S.: Deeptabstr: Deep learning based table structure recognition. In: 2019 International Conference on Document Analysis and Recognition (ICDAR). pp. 1403-1409 (2019). https:// doi.org/10.1109/ICDAR.2019.00226" }, { "label": "list_item", "id": 2, "page_no": 12, "cluster": { "id": 2, "label": "list_item", "bbox": { "l": 134.8, "t": 503.3, "r": 480.6, "b": 544.3, "coord_origin": "TOPLEFT" }, "confidence": 0.97, "cells": [ { "index": 53, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 134.8, "r_y0": 511.4, "r_x1": 146.2, "r_y1": 511.4, "r_x2": 146.2, "r_y2": 503.3, "r_x3": 134.8, "r_y3": 503.3, "coord_origin": "TOPLEFT" }, "text": "14.", "orig": "14.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 54, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 150.6, "r_y0": 511.4, "r_x1": 480.6, "r_y1": 511.4, "r_x2": 480.6, "r_y2": 503.3, "r_x3": 150.6, "r_y3": 503.3, "coord_origin": "TOPLEFT" }, "text": "Smock, B., Pesala, R., Abraham, R.: PubTables-1M: Towards comprehensive ta-", "orig": "Smock, B., Pesala, R., Abraham, R.: PubTables-1M: Towards comprehensive ta-", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 55, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 151.5, "r_y0": 522.4, "r_x1": 480.6, "r_y1": 522.4, "r_x2": 480.6, "r_y2": 514.3, "r_x3": 151.5, "r_y3": 514.3, "coord_origin": "TOPLEFT" }, "text": "ble extraction from unstructured documents. In: Proceedings of the IEEE/CVF", "orig": "ble extraction from unstructured documents. In: Proceedings of the IEEE/CVF", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 56, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 151.5, "r_y0": 533.3, "r_x1": 480.6, "r_y1": 533.3, "r_x2": 480.6, "r_y2": 525.3, "r_x3": 151.5, "r_y3": 525.3, "coord_origin": "TOPLEFT" }, "text": "Conference on Computer Vision and Pattern Recognition (CVPR). pp. 4634-4642", "orig": "Conference on Computer Vision and Pattern Recognition (CVPR). pp. 4634-4642", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 57, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 151.5, "r_y0": 544.3, "r_x1": 199.2, "r_y1": 544.3, "r_x2": 199.2, "r_y2": 536.2, "r_x3": 151.5, "r_y3": 536.2, "coord_origin": "TOPLEFT" }, "text": "(June 2022)", "orig": "(June 2022)", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, "text": "14. Smock, B., Pesala, R., Abraham, R.: PubTables-1M: Towards comprehensive table extraction from unstructured documents. In: Proceedings of the IEEE/CVF Conference on Computer Vision and Pattern Recognition (CVPR). pp. 4634-4642 (June 2022)" }, { "label": "list_item", "id": 6, "page_no": 12, "cluster": { "id": 6, "label": "list_item", "bbox": { "l": 134.8, "t": 547.2, "r": 480.6, "b": 610.1, "coord_origin": "TOPLEFT" }, "confidence": 0.97, "cells": [ { "index": 58, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 134.8, "r_y0": 555.3, "r_x1": 146.2, "r_y1": 555.3, "r_x2": 146.2, "r_y2": 547.2, "r_x3": 134.8, "r_y3": 547.2, "coord_origin": "TOPLEFT" }, "text": "15.", "orig": "15.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 59, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 150.6, "r_y0": 555.3, "r_x1": 480.6, "r_y1": 555.3, "r_x2": 480.6, "r_y2": 547.2, "r_x3": 150.6, "r_y3": 547.2, "coord_origin": "TOPLEFT" }, "text": "Staar, P.W.J., Dolfi, M., Auer, C., Bekas, C.: Corpus conversion service: A ma-", "orig": "Staar, P.W.J., Dolfi, M., Auer, C., Bekas, C.: Corpus conversion service: A ma-", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 60, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 151.5, "r_y0": 566.2, "r_x1": 480.6, "r_y1": 566.2, "r_x2": 480.6, "r_y2": 558.1, "r_x3": 151.5, "r_y3": 558.1, "coord_origin": "TOPLEFT" }, "text": "chine learning platform to ingest documents at scale. In: Proceedings of the 24th", "orig": "chine learning platform to ingest documents at scale. In: Proceedings of the 24th", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 61, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 151.5, "r_y0": 577.2, "r_x1": 480.6, "r_y1": 577.2, "r_x2": 480.6, "r_y2": 569.1, "r_x3": 151.5, "r_y3": 569.1, "coord_origin": "TOPLEFT" }, "text": "ACM SIGKDD International Conference on Knowledge Discovery & Data Min-", "orig": "ACM SIGKDD International Conference on Knowledge Discovery & Data Min-", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 62, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 151.5, "r_y0": 588.1, "r_x1": 480.6, "r_y1": 588.1, "r_x2": 480.6, "r_y2": 580.1, "r_x3": 151.5, "r_y3": 580.1, "coord_origin": "TOPLEFT" }, "text": "ing. pp. 774-782. KDD \u201918, Association for Computing Machinery, New York, NY,", "orig": "ing. pp. 774-782. KDD \u201918, Association for Computing Machinery, New York, NY,", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 63, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 151.5, "r_y0": 599.1, "r_x1": 200.8, "r_y1": 599.1, "r_x2": 200.8, "r_y2": 591.0, "r_x3": 151.5, "r_y3": 591.0, "coord_origin": "TOPLEFT" }, "text": "USA (2018).", "orig": "USA (2018).", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 64, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 202.9, "r_y0": 599.1, "r_x1": 386.5, "r_y1": 599.1, "r_x2": 386.5, "r_y2": 591.7, "r_x3": 202.9, "r_y3": 591.7, "coord_origin": "TOPLEFT" }, "text": "https://doi.org/10.1145/3219819.3219834", "orig": "https://doi.org/10.1145/3219819.3219834", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 65, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 386.5, "r_y0": 599.1, "r_x1": 389.0, "r_y1": 599.1, "r_x2": 389.0, "r_y2": 591.0, "r_x3": 386.5, "r_y3": 591.0, "coord_origin": "TOPLEFT" }, "text": ",", "orig": ",", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 66, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 391.2, "r_y0": 599.1, "r_x1": 480.6, "r_y1": 599.1, "r_x2": 480.6, "r_y2": 591.7, "r_x3": 391.2, "r_y3": 591.7, "coord_origin": "TOPLEFT" }, "text": "https://doi.org/10.", "orig": "https://doi.org/10.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 67, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 151.5, "r_y0": 610.1, "r_x1": 245.6, "r_y1": 610.1, "r_x2": 245.6, "r_y2": 602.6, "r_x3": 151.5, "r_y3": 602.6, "coord_origin": "TOPLEFT" }, "text": "1145/3219819.3219834", "orig": "1145/3219819.3219834", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, "text": "15. Staar, P.W.J., Dolfi, M., Auer, C., Bekas, C.: Corpus conversion service: A machine learning platform to ingest documents at scale. In: Proceedings of the 24th ACM SIGKDD International Conference on Knowledge Discovery & Data Mining. pp. 774-782. KDD '18, Association for Computing Machinery, New York, NY, USA (2018). https://doi.org/10.1145/3219819.3219834 , https://doi.org/10. 1145/3219819.3219834" }, { "label": "list_item", "id": 12, "page_no": 12, "cluster": { "id": 12, "label": "list_item", "bbox": { "l": 134.8, "t": 613.0, "r": 480.6, "b": 632.0, "coord_origin": "TOPLEFT" }, "confidence": 0.94, "cells": [ { "index": 68, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 134.8, "r_y0": 621.0, "r_x1": 146.6, "r_y1": 621.0, "r_x2": 146.6, "r_y2": 613.0, "r_x3": 134.8, "r_y3": 613.0, "coord_origin": "TOPLEFT" }, "text": "16.", "orig": "16.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 69, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 151.3, "r_y0": 621.0, "r_x1": 480.6, "r_y1": 621.0, "r_x2": 480.6, "r_y2": 613.0, "r_x3": 151.3, "r_y3": 613.0, "coord_origin": "TOPLEFT" }, "text": "Wang, X.: Tabular Abstraction, Editing, and Formatting. Ph.D. thesis, CAN", "orig": "Wang, X.: Tabular Abstraction, Editing, and Formatting. Ph.D. thesis, CAN", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 70, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 151.5, "r_y0": 632.0, "r_x1": 234.4, "r_y1": 632.0, "r_x2": 234.4, "r_y2": 623.9, "r_x3": 151.5, "r_y3": 623.9, "coord_origin": "TOPLEFT" }, "text": "(1996), aAINN09397", "orig": "(1996), aAINN09397", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, "text": "16. Wang, X.: Tabular Abstraction, Editing, and Formatting. Ph.D. thesis, CAN (1996), aAINN09397" }, { "label": "list_item", "id": 8, "page_no": 12, "cluster": { "id": 8, "label": "list_item", "bbox": { "l": 134.8, "t": 634.9, "r": 480.6, "b": 664.9, "coord_origin": "TOPLEFT" }, "confidence": 0.96, "cells": [ { "index": 71, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 134.8, "r_y0": 642.9, "r_x1": 146.3, "r_y1": 642.9, "r_x2": 146.3, "r_y2": 634.9, "r_x3": 134.8, "r_y3": 634.9, "coord_origin": "TOPLEFT" }, "text": "17.", "orig": "17.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 72, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 150.8, "r_y0": 642.9, "r_x1": 480.6, "r_y1": 642.9, "r_x2": 480.6, "r_y2": 634.9, "r_x3": 150.8, "r_y3": 634.9, "coord_origin": "TOPLEFT" }, "text": "Xue, W., Li, Q., Tao, D.: Res2tim: Reconstruct syntactic structures from table", "orig": "Xue, W., Li, Q., Tao, D.: Res2tim: Reconstruct syntactic structures from table", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 73, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 151.5, "r_y0": 653.9, "r_x1": 480.6, "r_y1": 653.9, "r_x2": 480.6, "r_y2": 645.8, "r_x3": 151.5, "r_y3": 645.8, "coord_origin": "TOPLEFT" }, "text": "images. In: 2019 International Conference on Document Analysis and Recognition", "orig": "images. In: 2019 International Conference on Document Analysis and Recognition", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 74, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 151.5, "r_y0": 664.9, "r_x1": 299.3, "r_y1": 664.9, "r_x2": 299.3, "r_y2": 656.8, "r_x3": 151.5, "r_y3": 656.8, "coord_origin": "TOPLEFT" }, "text": "(ICDAR). pp. 749-755. IEEE (2019)", "orig": "(ICDAR). pp. 749-755. IEEE (2019)", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, "text": "17. Xue, W., Li, Q., Tao, D.: Res2tim: Reconstruct syntactic structures from table images. In: 2019 International Conference on Document Analysis and Recognition (ICDAR). pp. 749-755. IEEE (2019)" } ], "headers": [ { "label": "page_header", "id": 13, "page_no": 12, "cluster": { "id": 13, "label": "page_header", "bbox": { "l": 194.5, "t": 93.8, "r": 447.5, "b": 101.8, "coord_origin": "TOPLEFT" }, "confidence": 0.92, "cells": [ { "index": 0, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 194.5, "r_y0": 101.8, "r_x1": 447.5, "r_y1": 101.8, "r_x2": 447.5, "r_y2": 93.8, "r_x3": 194.5, "r_y3": 93.8, "coord_origin": "TOPLEFT" }, "text": "Optimized Table Tokenization for Table Structure Recognition", "orig": "Optimized Table Tokenization for Table Structure Recognition", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, "text": "Optimized Table Tokenization for Table Structure Recognition" }, { "label": "page_header", "id": 14, "page_no": 12, "cluster": { "id": 14, "label": "page_header", "bbox": { "l": 471.4, "t": 93.8, "r": 480.6, "b": 101.8, "coord_origin": "TOPLEFT" }, "confidence": 0.91, "cells": [ { "index": 1, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 471.4, "r_y0": 101.8, "r_x1": 480.6, "r_y1": 101.8, "r_x2": 480.6, "r_y2": 93.8, "r_x3": 471.4, "r_y3": 93.8, "coord_origin": "TOPLEFT" }, "text": "13", "orig": "13", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, "text": "13" } ] } }, { "page_no": 13, "size": { "width": 612.0, "height": 792.0 }, "parsed_page": { "dimension": { "angle": 0.0, "rect": { "r_x0": 0.0, "r_y0": 0.0, "r_x1": 612.0, "r_y1": 0.0, "r_x2": 612.0, "r_y2": 792.0, "r_x3": 0.0, "r_y3": 792.0, "coord_origin": "BOTTOMLEFT" }, "boundary_type": "crop_box", "art_bbox": { "l": 0.0, "t": 792.0, "r": 612.0, "b": 0.0, "coord_origin": "BOTTOMLEFT" }, "bleed_bbox": { "l": 0.0, "t": 792.0, "r": 612.0, "b": 0.0, "coord_origin": "BOTTOMLEFT" }, "crop_bbox": { "l": 0.0, "t": 792.0, "r": 612.0, "b": 0.0, "coord_origin": "BOTTOMLEFT" }, "media_bbox": { "l": 0.0, "t": 792.0, "r": 612.0, "b": 0.0, "coord_origin": "BOTTOMLEFT" }, "trim_bbox": { "l": 0.0, "t": 792.0, "r": 612.0, "b": 0.0, "coord_origin": "BOTTOMLEFT" } }, "bitmap_resources": [], "char_cells": [], "word_cells": [], "textline_cells": [ { "index": 0, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 134.8, "r_y0": 101.8, "r_x1": 144.0, "r_y1": 101.8, "r_x2": 144.0, "r_y2": 93.8, "r_x3": 134.8, "r_y3": 93.8, "coord_origin": "TOPLEFT" }, "text": "14", "orig": "14", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 1, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 167.8, "r_y0": 101.8, "r_x1": 178.1, "r_y1": 101.8, "r_x2": 178.1, "r_y2": 93.8, "r_x3": 167.8, "r_y3": 93.8, "coord_origin": "TOPLEFT" }, "text": "M.", "orig": "M.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 2, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 182.4, "r_y0": 101.8, "r_x1": 231.7, "r_y1": 101.8, "r_x2": 231.7, "r_y2": 93.8, "r_x3": 182.4, "r_y3": 93.8, "coord_origin": "TOPLEFT" }, "text": "Lysak, et al.", "orig": "Lysak, et al.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 3, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 134.8, "r_y0": 127.7, "r_x1": 146.1, "r_y1": 127.7, "r_x2": 146.1, "r_y2": 119.7, "r_x3": 134.8, "r_y3": 119.7, "coord_origin": "TOPLEFT" }, "text": "18.", "orig": "18.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 4, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 150.5, "r_y0": 127.7, "r_x1": 480.6, "r_y1": 127.7, "r_x2": 480.6, "r_y2": 119.7, "r_x3": 150.5, "r_y3": 119.7, "coord_origin": "TOPLEFT" }, "text": "Xue, W., Yu, B., Wang, W., Tao, D., Li, Q.: Tgrnet: A table graph reconstruc-", "orig": "Xue, W., Yu, B., Wang, W., Tao, D., Li, Q.: Tgrnet: A table graph reconstruc-", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 5, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 151.5, "r_y0": 138.7, "r_x1": 480.6, "r_y1": 138.7, "r_x2": 480.6, "r_y2": 130.6, "r_x3": 151.5, "r_y3": 130.6, "coord_origin": "TOPLEFT" }, "text": "tion network for table structure recognition. In: Proceedings of the IEEE/CVF", "orig": "tion network for table structure recognition. In: Proceedings of the IEEE/CVF", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 6, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 151.5, "r_y0": 149.7, "r_x1": 427.5, "r_y1": 149.7, "r_x2": 427.5, "r_y2": 141.6, "r_x3": 151.5, "r_y3": 141.6, "coord_origin": "TOPLEFT" }, "text": "International Conference on Computer Vision. pp. 1295-1304 (2021)", "orig": "International Conference on Computer Vision. pp. 1295-1304 (2021)", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 7, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 134.8, "r_y0": 160.6, "r_x1": 146.2, "r_y1": 160.6, "r_x2": 146.2, "r_y2": 152.6, "r_x3": 134.8, "r_y3": 152.6, "coord_origin": "TOPLEFT" }, "text": "19.", "orig": "19.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 8, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 150.7, "r_y0": 160.6, "r_x1": 480.6, "r_y1": 160.6, "r_x2": 480.6, "r_y2": 152.6, "r_x3": 150.7, "r_y3": 152.6, "coord_origin": "TOPLEFT" }, "text": "Ye, J., Qi, X., He, Y., Chen, Y., Gu, D., Gao, P., Xiao, R.: Pingan-vcgroup\u2019s", "orig": "Ye, J., Qi, X., He, Y., Chen, Y., Gu, D., Gao, P., Xiao, R.: Pingan-vcgroup\u2019s", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 9, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 151.5, "r_y0": 171.6, "r_x1": 480.6, "r_y1": 171.6, "r_x2": 480.6, "r_y2": 163.5, "r_x3": 151.5, "r_y3": 163.5, "coord_origin": "TOPLEFT" }, "text": "solution for icdar 2021 competition on scientific literature parsing task b: Ta-", "orig": "solution for icdar 2021 competition on scientific literature parsing task b: Ta-", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 10, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 151.5, "r_y0": 182.5, "r_x1": 280.6, "r_y1": 182.5, "r_x2": 280.6, "r_y2": 174.5, "r_x3": 151.5, "r_y3": 174.5, "coord_origin": "TOPLEFT" }, "text": "ble recognition to html (2021).", "orig": "ble recognition to html (2021).", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 11, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 285.1, "r_y0": 182.6, "r_x1": 478.0, "r_y1": 182.6, "r_x2": 478.0, "r_y2": 175.1, "r_x3": 285.1, "r_y3": 175.1, "coord_origin": "TOPLEFT" }, "text": "https://doi.org/10.48550/ARXIV.2105.01848", "orig": "https://doi.org/10.48550/ARXIV.2105.01848", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 12, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 478.0, "r_y0": 182.5, "r_x1": 480.6, "r_y1": 182.5, "r_x2": 480.6, "r_y2": 174.5, "r_x3": 478.0, "r_y3": 174.5, "coord_origin": "TOPLEFT" }, "text": ",", "orig": ",", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 13, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 151.5, "r_y0": 193.5, "r_x1": 302.1, "r_y1": 193.5, "r_x2": 302.1, "r_y2": 186.1, "r_x3": 151.5, "r_y3": 186.1, "coord_origin": "TOPLEFT" }, "text": "https://arxiv.org/abs/2105.01848", "orig": "https://arxiv.org/abs/2105.01848", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 14, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 134.8, "r_y0": 204.5, "r_x1": 145.7, "r_y1": 204.5, "r_x2": 145.7, "r_y2": 196.4, "r_x3": 134.8, "r_y3": 196.4, "coord_origin": "TOPLEFT" }, "text": "20.", "orig": "20.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 15, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 149.9, "r_y0": 204.5, "r_x1": 480.6, "r_y1": 204.5, "r_x2": 480.6, "r_y2": 196.4, "r_x3": 149.9, "r_y3": 196.4, "coord_origin": "TOPLEFT" }, "text": "Zhang, Z., Zhang, J., Du, J., Wang, F.: Split, embed and merge: An accurate table", "orig": "Zhang, Z., Zhang, J., Du, J., Wang, F.: Split, embed and merge: An accurate table", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 16, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 151.5, "r_y0": 215.4, "r_x1": 318.6, "r_y1": 215.4, "r_x2": 318.6, "r_y2": 207.3, "r_x3": 151.5, "r_y3": 207.3, "coord_origin": "TOPLEFT" }, "text": "structure recognizer. Pattern Recognition", "orig": "structure recognizer. Pattern Recognition", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 17, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 321.6, "r_y0": 215.2, "r_x1": 337.5, "r_y1": 215.2, "r_x2": 337.5, "r_y2": 207.3, "r_x3": 321.6, "r_y3": 207.3, "coord_origin": "TOPLEFT" }, "text": "126", "orig": "126", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 18, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 337.5, "r_y0": 215.4, "r_x1": 399.5, "r_y1": 215.4, "r_x2": 399.5, "r_y2": 207.3, "r_x3": 337.5, "r_y3": 207.3, "coord_origin": "TOPLEFT" }, "text": ", 108565 (2022)", "orig": ", 108565 (2022)", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 19, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 134.8, "r_y0": 226.4, "r_x1": 145.7, "r_y1": 226.4, "r_x2": 145.7, "r_y2": 218.3, "r_x3": 134.8, "r_y3": 218.3, "coord_origin": "TOPLEFT" }, "text": "21.", "orig": "21.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 20, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 150.0, "r_y0": 226.4, "r_x1": 480.6, "r_y1": 226.4, "r_x2": 480.6, "r_y2": 218.3, "r_x3": 150.0, "r_y3": 218.3, "coord_origin": "TOPLEFT" }, "text": "Zheng, X., Burdick, D., Popa, L., Zhong, X., Wang, N.X.R.: Global table extractor", "orig": "Zheng, X., Burdick, D., Popa, L., Zhong, X., Wang, N.X.R.: Global table extractor", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 21, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 151.5, "r_y0": 237.3, "r_x1": 480.6, "r_y1": 237.3, "r_x2": 480.6, "r_y2": 229.3, "r_x3": 151.5, "r_y3": 229.3, "coord_origin": "TOPLEFT" }, "text": "(gte): A framework for joint table identification and cell structure recognition using", "orig": "(gte): A framework for joint table identification and cell structure recognition using", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 22, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 151.5, "r_y0": 248.3, "r_x1": 480.6, "r_y1": 248.3, "r_x2": 480.6, "r_y2": 240.2, "r_x3": 151.5, "r_y3": 240.2, "coord_origin": "TOPLEFT" }, "text": "visual context. In: 2021 IEEE Winter Conference on Applications of Computer Vi-", "orig": "visual context. In: 2021 IEEE Winter Conference on Applications of Computer Vi-", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 23, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 151.5, "r_y0": 259.3, "r_x1": 293.4, "r_y1": 259.3, "r_x2": 293.4, "r_y2": 251.2, "r_x3": 151.5, "r_y3": 251.2, "coord_origin": "TOPLEFT" }, "text": "sion (WACV). pp. 697-706 (2021).", "orig": "sion (WACV). pp. 697-706 (2021).", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 24, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 297.0, "r_y0": 259.3, "r_x1": 480.6, "r_y1": 259.3, "r_x2": 480.6, "r_y2": 251.8, "r_x3": 297.0, "r_y3": 251.8, "coord_origin": "TOPLEFT" }, "text": "https://doi.org/10.1109/WACV48630.2021.", "orig": "https://doi.org/10.1109/WACV48630.2021.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 25, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 151.5, "r_y0": 270.3, "r_x1": 175.1, "r_y1": 270.3, "r_x2": 175.1, "r_y2": 262.8, "r_x3": 151.5, "r_y3": 262.8, "coord_origin": "TOPLEFT" }, "text": "00074", "orig": "00074", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 26, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 134.8, "r_y0": 281.2, "r_x1": 146.4, "r_y1": 281.2, "r_x2": 146.4, "r_y2": 273.1, "r_x3": 134.8, "r_y3": 273.1, "coord_origin": "TOPLEFT" }, "text": "22.", "orig": "22.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 27, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 150.9, "r_y0": 281.2, "r_x1": 480.6, "r_y1": 281.2, "r_x2": 480.6, "r_y2": 273.1, "r_x3": 150.9, "r_y3": 273.1, "coord_origin": "TOPLEFT" }, "text": "Zhong, X., ShafieiBavani, E., Jimeno Yepes, A.: Image-based table recognition:", "orig": "Zhong, X., ShafieiBavani, E., Jimeno Yepes, A.: Image-based table recognition:", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 28, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 151.5, "r_y0": 292.1, "r_x1": 480.6, "r_y1": 292.1, "r_x2": 480.6, "r_y2": 284.1, "r_x3": 151.5, "r_y3": 284.1, "coord_origin": "TOPLEFT" }, "text": "Data, model, and evaluation. In: Vedaldi, A., Bischof, H., Brox, T., Frahm, J.M.", "orig": "Data, model, and evaluation. In: Vedaldi, A., Bischof, H., Brox, T., Frahm, J.M.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 29, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 151.5, "r_y0": 303.1, "r_x1": 480.6, "r_y1": 303.1, "r_x2": 480.6, "r_y2": 295.0, "r_x3": 151.5, "r_y3": 295.0, "coord_origin": "TOPLEFT" }, "text": "(eds.) Computer Vision - ECCV 2020. pp. 564-580. Springer International Pub-", "orig": "(eds.) Computer Vision - ECCV 2020. pp. 564-580. Springer International Pub-", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 30, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 151.5, "r_y0": 314.0, "r_x1": 236.0, "r_y1": 314.0, "r_x2": 236.0, "r_y2": 306.0, "r_x3": 151.5, "r_y3": 306.0, "coord_origin": "TOPLEFT" }, "text": "lishing, Cham (2020)", "orig": "lishing, Cham (2020)", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 31, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 134.8, "r_y0": 325.0, "r_x1": 145.7, "r_y1": 325.0, "r_x2": 145.7, "r_y2": 316.9, "r_x3": 134.8, "r_y3": 316.9, "coord_origin": "TOPLEFT" }, "text": "23.", "orig": "23.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 32, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 150.0, "r_y0": 325.0, "r_x1": 480.6, "r_y1": 325.0, "r_x2": 480.6, "r_y2": 316.9, "r_x3": 150.0, "r_y3": 316.9, "coord_origin": "TOPLEFT" }, "text": "Zhong, X., Tang, J., Yepes, A.J.: Publaynet: largest dataset ever for document lay-", "orig": "Zhong, X., Tang, J., Yepes, A.J.: Publaynet: largest dataset ever for document lay-", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 33, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 151.5, "r_y0": 336.0, "r_x1": 480.6, "r_y1": 336.0, "r_x2": 480.6, "r_y2": 327.9, "r_x3": 151.5, "r_y3": 327.9, "coord_origin": "TOPLEFT" }, "text": "out analysis. In: 2019 International Conference on Document Analysis and Recog-", "orig": "out analysis. In: 2019 International Conference on Document Analysis and Recog-", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 34, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 151.5, "r_y0": 346.9, "r_x1": 335.1, "r_y1": 346.9, "r_x2": 335.1, "r_y2": 338.9, "r_x3": 151.5, "r_y3": 338.9, "coord_origin": "TOPLEFT" }, "text": "nition (ICDAR). pp. 1015-1022. IEEE (2019)", "orig": "nition (ICDAR). pp. 1015-1022. IEEE (2019)", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "has_chars": false, "has_words": false, "has_lines": true, "image": null, "lines": [] }, "predictions": { "layout": { "clusters": [ { "id": 7, "label": "page_header", "bbox": { "l": 134.8, "t": 93.8, "r": 144.0, "b": 101.8, "coord_origin": "TOPLEFT" }, "confidence": 0.7, "cells": [ { "index": 0, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 134.8, "r_y0": 101.8, "r_x1": 144.0, "r_y1": 101.8, "r_x2": 144.0, "r_y2": 93.8, "r_x3": 134.8, "r_y3": 93.8, "coord_origin": "TOPLEFT" }, "text": "14", "orig": "14", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 6, "label": "page_header", "bbox": { "l": 167.8, "t": 93.8, "r": 231.7, "b": 101.8, "coord_origin": "TOPLEFT" }, "confidence": 0.79, "cells": [ { "index": 1, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 167.8, "r_y0": 101.8, "r_x1": 178.1, "r_y1": 101.8, "r_x2": 178.1, "r_y2": 93.8, "r_x3": 167.8, "r_y3": 93.8, "coord_origin": "TOPLEFT" }, "text": "M.", "orig": "M.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 2, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 182.4, "r_y0": 101.8, "r_x1": 231.7, "r_y1": 101.8, "r_x2": 231.7, "r_y2": 93.8, "r_x3": 182.4, "r_y3": 93.8, "coord_origin": "TOPLEFT" }, "text": "Lysak, et al.", "orig": "Lysak, et al.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 5, "label": "list_item", "bbox": { "l": 134.8, "t": 119.7, "r": 480.6, "b": 149.7, "coord_origin": "TOPLEFT" }, "confidence": 0.94, "cells": [ { "index": 3, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 134.8, "r_y0": 127.7, "r_x1": 146.1, "r_y1": 127.7, "r_x2": 146.1, "r_y2": 119.7, "r_x3": 134.8, "r_y3": 119.7, "coord_origin": "TOPLEFT" }, "text": "18.", "orig": "18.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 4, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 150.5, "r_y0": 127.7, "r_x1": 480.6, "r_y1": 127.7, "r_x2": 480.6, "r_y2": 119.7, "r_x3": 150.5, "r_y3": 119.7, "coord_origin": "TOPLEFT" }, "text": "Xue, W., Yu, B., Wang, W., Tao, D., Li, Q.: Tgrnet: A table graph reconstruc-", "orig": "Xue, W., Yu, B., Wang, W., Tao, D., Li, Q.: Tgrnet: A table graph reconstruc-", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 5, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 151.5, "r_y0": 138.7, "r_x1": 480.6, "r_y1": 138.7, "r_x2": 480.6, "r_y2": 130.6, "r_x3": 151.5, "r_y3": 130.6, "coord_origin": "TOPLEFT" }, "text": "tion network for table structure recognition. In: Proceedings of the IEEE/CVF", "orig": "tion network for table structure recognition. In: Proceedings of the IEEE/CVF", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 6, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 151.5, "r_y0": 149.7, "r_x1": 427.5, "r_y1": 149.7, "r_x2": 427.5, "r_y2": 141.6, "r_x3": 151.5, "r_y3": 141.6, "coord_origin": "TOPLEFT" }, "text": "International Conference on Computer Vision. pp. 1295-1304 (2021)", "orig": "International Conference on Computer Vision. pp. 1295-1304 (2021)", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 3, "label": "list_item", "bbox": { "l": 134.8, "t": 152.6, "r": 480.6, "b": 193.5, "coord_origin": "TOPLEFT" }, "confidence": 0.95, "cells": [ { "index": 7, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 134.8, "r_y0": 160.6, "r_x1": 146.2, "r_y1": 160.6, "r_x2": 146.2, "r_y2": 152.6, "r_x3": 134.8, "r_y3": 152.6, "coord_origin": "TOPLEFT" }, "text": "19.", "orig": "19.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 8, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 150.7, "r_y0": 160.6, "r_x1": 480.6, "r_y1": 160.6, "r_x2": 480.6, "r_y2": 152.6, "r_x3": 150.7, "r_y3": 152.6, "coord_origin": "TOPLEFT" }, "text": "Ye, J., Qi, X., He, Y., Chen, Y., Gu, D., Gao, P., Xiao, R.: Pingan-vcgroup\u2019s", "orig": "Ye, J., Qi, X., He, Y., Chen, Y., Gu, D., Gao, P., Xiao, R.: Pingan-vcgroup\u2019s", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 9, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 151.5, "r_y0": 171.6, "r_x1": 480.6, "r_y1": 171.6, "r_x2": 480.6, "r_y2": 163.5, "r_x3": 151.5, "r_y3": 163.5, "coord_origin": "TOPLEFT" }, "text": "solution for icdar 2021 competition on scientific literature parsing task b: Ta-", "orig": "solution for icdar 2021 competition on scientific literature parsing task b: Ta-", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 10, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 151.5, "r_y0": 182.5, "r_x1": 280.6, "r_y1": 182.5, "r_x2": 280.6, "r_y2": 174.5, "r_x3": 151.5, "r_y3": 174.5, "coord_origin": "TOPLEFT" }, "text": "ble recognition to html (2021).", "orig": "ble recognition to html (2021).", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 11, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 285.1, "r_y0": 182.6, "r_x1": 478.0, "r_y1": 182.6, "r_x2": 478.0, "r_y2": 175.1, "r_x3": 285.1, "r_y3": 175.1, "coord_origin": "TOPLEFT" }, "text": "https://doi.org/10.48550/ARXIV.2105.01848", "orig": "https://doi.org/10.48550/ARXIV.2105.01848", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 12, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 478.0, "r_y0": 182.5, "r_x1": 480.6, "r_y1": 182.5, "r_x2": 480.6, "r_y2": 174.5, "r_x3": 478.0, "r_y3": 174.5, "coord_origin": "TOPLEFT" }, "text": ",", "orig": ",", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 13, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 151.5, "r_y0": 193.5, "r_x1": 302.1, "r_y1": 193.5, "r_x2": 302.1, "r_y2": 186.1, "r_x3": 151.5, "r_y3": 186.1, "coord_origin": "TOPLEFT" }, "text": "https://arxiv.org/abs/2105.01848", "orig": "https://arxiv.org/abs/2105.01848", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 4, "label": "list_item", "bbox": { "l": 134.8, "t": 196.4, "r": 480.6, "b": 215.4, "coord_origin": "TOPLEFT" }, "confidence": 0.95, "cells": [ { "index": 14, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 134.8, "r_y0": 204.5, "r_x1": 145.7, "r_y1": 204.5, "r_x2": 145.7, "r_y2": 196.4, "r_x3": 134.8, "r_y3": 196.4, "coord_origin": "TOPLEFT" }, "text": "20.", "orig": "20.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 15, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 149.9, "r_y0": 204.5, "r_x1": 480.6, "r_y1": 204.5, "r_x2": 480.6, "r_y2": 196.4, "r_x3": 149.9, "r_y3": 196.4, "coord_origin": "TOPLEFT" }, "text": "Zhang, Z., Zhang, J., Du, J., Wang, F.: Split, embed and merge: An accurate table", "orig": "Zhang, Z., Zhang, J., Du, J., Wang, F.: Split, embed and merge: An accurate table", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 16, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 151.5, "r_y0": 215.4, "r_x1": 318.6, "r_y1": 215.4, "r_x2": 318.6, "r_y2": 207.3, "r_x3": 151.5, "r_y3": 207.3, "coord_origin": "TOPLEFT" }, "text": "structure recognizer. Pattern Recognition", "orig": "structure recognizer. Pattern Recognition", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 17, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 321.6, "r_y0": 215.2, "r_x1": 337.5, "r_y1": 215.2, "r_x2": 337.5, "r_y2": 207.3, "r_x3": 321.6, "r_y3": 207.3, "coord_origin": "TOPLEFT" }, "text": "126", "orig": "126", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 18, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 337.5, "r_y0": 215.4, "r_x1": 399.5, "r_y1": 215.4, "r_x2": 399.5, "r_y2": 207.3, "r_x3": 337.5, "r_y3": 207.3, "coord_origin": "TOPLEFT" }, "text": ", 108565 (2022)", "orig": ", 108565 (2022)", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 0, "label": "list_item", "bbox": { "l": 134.8, "t": 218.3, "r": 480.6, "b": 270.3, "coord_origin": "TOPLEFT" }, "confidence": 0.97, "cells": [ { "index": 19, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 134.8, "r_y0": 226.4, "r_x1": 145.7, "r_y1": 226.4, "r_x2": 145.7, "r_y2": 218.3, "r_x3": 134.8, "r_y3": 218.3, "coord_origin": "TOPLEFT" }, "text": "21.", "orig": "21.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 20, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 150.0, "r_y0": 226.4, "r_x1": 480.6, "r_y1": 226.4, "r_x2": 480.6, "r_y2": 218.3, "r_x3": 150.0, "r_y3": 218.3, "coord_origin": "TOPLEFT" }, "text": "Zheng, X., Burdick, D., Popa, L., Zhong, X., Wang, N.X.R.: Global table extractor", "orig": "Zheng, X., Burdick, D., Popa, L., Zhong, X., Wang, N.X.R.: Global table extractor", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 21, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 151.5, "r_y0": 237.3, "r_x1": 480.6, "r_y1": 237.3, "r_x2": 480.6, "r_y2": 229.3, "r_x3": 151.5, "r_y3": 229.3, "coord_origin": "TOPLEFT" }, "text": "(gte): A framework for joint table identification and cell structure recognition using", "orig": "(gte): A framework for joint table identification and cell structure recognition using", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 22, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 151.5, "r_y0": 248.3, "r_x1": 480.6, "r_y1": 248.3, "r_x2": 480.6, "r_y2": 240.2, "r_x3": 151.5, "r_y3": 240.2, "coord_origin": "TOPLEFT" }, "text": "visual context. In: 2021 IEEE Winter Conference on Applications of Computer Vi-", "orig": "visual context. In: 2021 IEEE Winter Conference on Applications of Computer Vi-", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 23, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 151.5, "r_y0": 259.3, "r_x1": 293.4, "r_y1": 259.3, "r_x2": 293.4, "r_y2": 251.2, "r_x3": 151.5, "r_y3": 251.2, "coord_origin": "TOPLEFT" }, "text": "sion (WACV). pp. 697-706 (2021).", "orig": "sion (WACV). pp. 697-706 (2021).", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 24, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 297.0, "r_y0": 259.3, "r_x1": 480.6, "r_y1": 259.3, "r_x2": 480.6, "r_y2": 251.8, "r_x3": 297.0, "r_y3": 251.8, "coord_origin": "TOPLEFT" }, "text": "https://doi.org/10.1109/WACV48630.2021.", "orig": "https://doi.org/10.1109/WACV48630.2021.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 25, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 151.5, "r_y0": 270.3, "r_x1": 175.1, "r_y1": 270.3, "r_x2": 175.1, "r_y2": 262.8, "r_x3": 151.5, "r_y3": 262.8, "coord_origin": "TOPLEFT" }, "text": "00074", "orig": "00074", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 1, "label": "list_item", "bbox": { "l": 134.8, "t": 273.1, "r": 480.6, "b": 314.0, "coord_origin": "TOPLEFT" }, "confidence": 0.97, "cells": [ { "index": 26, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 134.8, "r_y0": 281.2, "r_x1": 146.4, "r_y1": 281.2, "r_x2": 146.4, "r_y2": 273.1, "r_x3": 134.8, "r_y3": 273.1, "coord_origin": "TOPLEFT" }, "text": "22.", "orig": "22.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 27, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 150.9, "r_y0": 281.2, "r_x1": 480.6, "r_y1": 281.2, "r_x2": 480.6, "r_y2": 273.1, "r_x3": 150.9, "r_y3": 273.1, "coord_origin": "TOPLEFT" }, "text": "Zhong, X., ShafieiBavani, E., Jimeno Yepes, A.: Image-based table recognition:", "orig": "Zhong, X., ShafieiBavani, E., Jimeno Yepes, A.: Image-based table recognition:", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 28, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 151.5, "r_y0": 292.1, "r_x1": 480.6, "r_y1": 292.1, "r_x2": 480.6, "r_y2": 284.1, "r_x3": 151.5, "r_y3": 284.1, "coord_origin": "TOPLEFT" }, "text": "Data, model, and evaluation. In: Vedaldi, A., Bischof, H., Brox, T., Frahm, J.M.", "orig": "Data, model, and evaluation. In: Vedaldi, A., Bischof, H., Brox, T., Frahm, J.M.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 29, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 151.5, "r_y0": 303.1, "r_x1": 480.6, "r_y1": 303.1, "r_x2": 480.6, "r_y2": 295.0, "r_x3": 151.5, "r_y3": 295.0, "coord_origin": "TOPLEFT" }, "text": "(eds.) Computer Vision - ECCV 2020. pp. 564-580. Springer International Pub-", "orig": "(eds.) Computer Vision - ECCV 2020. pp. 564-580. Springer International Pub-", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 30, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 151.5, "r_y0": 314.0, "r_x1": 236.0, "r_y1": 314.0, "r_x2": 236.0, "r_y2": 306.0, "r_x3": 151.5, "r_y3": 306.0, "coord_origin": "TOPLEFT" }, "text": "lishing, Cham (2020)", "orig": "lishing, Cham (2020)", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 2, "label": "list_item", "bbox": { "l": 134.8, "t": 316.9, "r": 480.6, "b": 346.9, "coord_origin": "TOPLEFT" }, "confidence": 0.97, "cells": [ { "index": 31, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 134.8, "r_y0": 325.0, "r_x1": 145.7, "r_y1": 325.0, "r_x2": 145.7, "r_y2": 316.9, "r_x3": 134.8, "r_y3": 316.9, "coord_origin": "TOPLEFT" }, "text": "23.", "orig": "23.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 32, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 150.0, "r_y0": 325.0, "r_x1": 480.6, "r_y1": 325.0, "r_x2": 480.6, "r_y2": 316.9, "r_x3": 150.0, "r_y3": 316.9, "coord_origin": "TOPLEFT" }, "text": "Zhong, X., Tang, J., Yepes, A.J.: Publaynet: largest dataset ever for document lay-", "orig": "Zhong, X., Tang, J., Yepes, A.J.: Publaynet: largest dataset ever for document lay-", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 33, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 151.5, "r_y0": 336.0, "r_x1": 480.6, "r_y1": 336.0, "r_x2": 480.6, "r_y2": 327.9, "r_x3": 151.5, "r_y3": 327.9, "coord_origin": "TOPLEFT" }, "text": "out analysis. In: 2019 International Conference on Document Analysis and Recog-", "orig": "out analysis. In: 2019 International Conference on Document Analysis and Recog-", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 34, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 151.5, "r_y0": 346.9, "r_x1": 335.1, "r_y1": 346.9, "r_x2": 335.1, "r_y2": 338.9, "r_x3": 151.5, "r_y3": 338.9, "coord_origin": "TOPLEFT" }, "text": "nition (ICDAR). pp. 1015-1022. IEEE (2019)", "orig": "nition (ICDAR). pp. 1015-1022. IEEE (2019)", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] } ] }, "tablestructure": { "table_map": {} }, "figures_classification": null, "equations_prediction": null, "vlm_response": null }, "assembled": { "elements": [ { "label": "page_header", "id": 7, "page_no": 13, "cluster": { "id": 7, "label": "page_header", "bbox": { "l": 134.8, "t": 93.8, "r": 144.0, "b": 101.8, "coord_origin": "TOPLEFT" }, "confidence": 0.7, "cells": [ { "index": 0, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 134.8, "r_y0": 101.8, "r_x1": 144.0, "r_y1": 101.8, "r_x2": 144.0, "r_y2": 93.8, "r_x3": 134.8, "r_y3": 93.8, "coord_origin": "TOPLEFT" }, "text": "14", "orig": "14", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, "text": "14" }, { "label": "page_header", "id": 6, "page_no": 13, "cluster": { "id": 6, "label": "page_header", "bbox": { "l": 167.8, "t": 93.8, "r": 231.7, "b": 101.8, "coord_origin": "TOPLEFT" }, "confidence": 0.79, "cells": [ { "index": 1, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 167.8, "r_y0": 101.8, "r_x1": 178.1, "r_y1": 101.8, "r_x2": 178.1, "r_y2": 93.8, "r_x3": 167.8, "r_y3": 93.8, "coord_origin": "TOPLEFT" }, "text": "M.", "orig": "M.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 2, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 182.4, "r_y0": 101.8, "r_x1": 231.7, "r_y1": 101.8, "r_x2": 231.7, "r_y2": 93.8, "r_x3": 182.4, "r_y3": 93.8, "coord_origin": "TOPLEFT" }, "text": "Lysak, et al.", "orig": "Lysak, et al.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, "text": "M. Lysak, et al." }, { "label": "list_item", "id": 5, "page_no": 13, "cluster": { "id": 5, "label": "list_item", "bbox": { "l": 134.8, "t": 119.7, "r": 480.6, "b": 149.7, "coord_origin": "TOPLEFT" }, "confidence": 0.94, "cells": [ { "index": 3, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 134.8, "r_y0": 127.7, "r_x1": 146.1, "r_y1": 127.7, "r_x2": 146.1, "r_y2": 119.7, "r_x3": 134.8, "r_y3": 119.7, "coord_origin": "TOPLEFT" }, "text": "18.", "orig": "18.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 4, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 150.5, "r_y0": 127.7, "r_x1": 480.6, "r_y1": 127.7, "r_x2": 480.6, "r_y2": 119.7, "r_x3": 150.5, "r_y3": 119.7, "coord_origin": "TOPLEFT" }, "text": "Xue, W., Yu, B., Wang, W., Tao, D., Li, Q.: Tgrnet: A table graph reconstruc-", "orig": "Xue, W., Yu, B., Wang, W., Tao, D., Li, Q.: Tgrnet: A table graph reconstruc-", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 5, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 151.5, "r_y0": 138.7, "r_x1": 480.6, "r_y1": 138.7, "r_x2": 480.6, "r_y2": 130.6, "r_x3": 151.5, "r_y3": 130.6, "coord_origin": "TOPLEFT" }, "text": "tion network for table structure recognition. In: Proceedings of the IEEE/CVF", "orig": "tion network for table structure recognition. In: Proceedings of the IEEE/CVF", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 6, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 151.5, "r_y0": 149.7, "r_x1": 427.5, "r_y1": 149.7, "r_x2": 427.5, "r_y2": 141.6, "r_x3": 151.5, "r_y3": 141.6, "coord_origin": "TOPLEFT" }, "text": "International Conference on Computer Vision. pp. 1295-1304 (2021)", "orig": "International Conference on Computer Vision. pp. 1295-1304 (2021)", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, "text": "18. Xue, W., Yu, B., Wang, W., Tao, D., Li, Q.: Tgrnet: A table graph reconstruction network for table structure recognition. In: Proceedings of the IEEE/CVF International Conference on Computer Vision. pp. 1295-1304 (2021)" }, { "label": "list_item", "id": 3, "page_no": 13, "cluster": { "id": 3, "label": "list_item", "bbox": { "l": 134.8, "t": 152.6, "r": 480.6, "b": 193.5, "coord_origin": "TOPLEFT" }, "confidence": 0.95, "cells": [ { "index": 7, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 134.8, "r_y0": 160.6, "r_x1": 146.2, "r_y1": 160.6, "r_x2": 146.2, "r_y2": 152.6, "r_x3": 134.8, "r_y3": 152.6, "coord_origin": "TOPLEFT" }, "text": "19.", "orig": "19.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 8, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 150.7, "r_y0": 160.6, "r_x1": 480.6, "r_y1": 160.6, "r_x2": 480.6, "r_y2": 152.6, "r_x3": 150.7, "r_y3": 152.6, "coord_origin": "TOPLEFT" }, "text": "Ye, J., Qi, X., He, Y., Chen, Y., Gu, D., Gao, P., Xiao, R.: Pingan-vcgroup\u2019s", "orig": "Ye, J., Qi, X., He, Y., Chen, Y., Gu, D., Gao, P., Xiao, R.: Pingan-vcgroup\u2019s", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 9, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 151.5, "r_y0": 171.6, "r_x1": 480.6, "r_y1": 171.6, "r_x2": 480.6, "r_y2": 163.5, "r_x3": 151.5, "r_y3": 163.5, "coord_origin": "TOPLEFT" }, "text": "solution for icdar 2021 competition on scientific literature parsing task b: Ta-", "orig": "solution for icdar 2021 competition on scientific literature parsing task b: Ta-", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 10, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 151.5, "r_y0": 182.5, "r_x1": 280.6, "r_y1": 182.5, "r_x2": 280.6, "r_y2": 174.5, "r_x3": 151.5, "r_y3": 174.5, "coord_origin": "TOPLEFT" }, "text": "ble recognition to html (2021).", "orig": "ble recognition to html (2021).", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 11, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 285.1, "r_y0": 182.6, "r_x1": 478.0, "r_y1": 182.6, "r_x2": 478.0, "r_y2": 175.1, "r_x3": 285.1, "r_y3": 175.1, "coord_origin": "TOPLEFT" }, "text": "https://doi.org/10.48550/ARXIV.2105.01848", "orig": "https://doi.org/10.48550/ARXIV.2105.01848", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 12, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 478.0, "r_y0": 182.5, "r_x1": 480.6, "r_y1": 182.5, "r_x2": 480.6, "r_y2": 174.5, "r_x3": 478.0, "r_y3": 174.5, "coord_origin": "TOPLEFT" }, "text": ",", "orig": ",", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 13, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 151.5, "r_y0": 193.5, "r_x1": 302.1, "r_y1": 193.5, "r_x2": 302.1, "r_y2": 186.1, "r_x3": 151.5, "r_y3": 186.1, "coord_origin": "TOPLEFT" }, "text": "https://arxiv.org/abs/2105.01848", "orig": "https://arxiv.org/abs/2105.01848", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, "text": "19. Ye, J., Qi, X., He, Y., Chen, Y., Gu, D., Gao, P., Xiao, R.: Pingan-vcgroup's solution for icdar 2021 competition on scientific literature parsing task b: Table recognition to html (2021). https://doi.org/10.48550/ARXIV.2105.01848 , https://arxiv.org/abs/2105.01848" }, { "label": "list_item", "id": 4, "page_no": 13, "cluster": { "id": 4, "label": "list_item", "bbox": { "l": 134.8, "t": 196.4, "r": 480.6, "b": 215.4, "coord_origin": "TOPLEFT" }, "confidence": 0.95, "cells": [ { "index": 14, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 134.8, "r_y0": 204.5, "r_x1": 145.7, "r_y1": 204.5, "r_x2": 145.7, "r_y2": 196.4, "r_x3": 134.8, "r_y3": 196.4, "coord_origin": "TOPLEFT" }, "text": "20.", "orig": "20.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 15, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 149.9, "r_y0": 204.5, "r_x1": 480.6, "r_y1": 204.5, "r_x2": 480.6, "r_y2": 196.4, "r_x3": 149.9, "r_y3": 196.4, "coord_origin": "TOPLEFT" }, "text": "Zhang, Z., Zhang, J., Du, J., Wang, F.: Split, embed and merge: An accurate table", "orig": "Zhang, Z., Zhang, J., Du, J., Wang, F.: Split, embed and merge: An accurate table", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 16, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 151.5, "r_y0": 215.4, "r_x1": 318.6, "r_y1": 215.4, "r_x2": 318.6, "r_y2": 207.3, "r_x3": 151.5, "r_y3": 207.3, "coord_origin": "TOPLEFT" }, "text": "structure recognizer. Pattern Recognition", "orig": "structure recognizer. Pattern Recognition", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 17, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 321.6, "r_y0": 215.2, "r_x1": 337.5, "r_y1": 215.2, "r_x2": 337.5, "r_y2": 207.3, "r_x3": 321.6, "r_y3": 207.3, "coord_origin": "TOPLEFT" }, "text": "126", "orig": "126", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 18, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 337.5, "r_y0": 215.4, "r_x1": 399.5, "r_y1": 215.4, "r_x2": 399.5, "r_y2": 207.3, "r_x3": 337.5, "r_y3": 207.3, "coord_origin": "TOPLEFT" }, "text": ", 108565 (2022)", "orig": ", 108565 (2022)", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, "text": "20. Zhang, Z., Zhang, J., Du, J., Wang, F.: Split, embed and merge: An accurate table structure recognizer. Pattern Recognition 126 , 108565 (2022)" }, { "label": "list_item", "id": 0, "page_no": 13, "cluster": { "id": 0, "label": "list_item", "bbox": { "l": 134.8, "t": 218.3, "r": 480.6, "b": 270.3, "coord_origin": "TOPLEFT" }, "confidence": 0.97, "cells": [ { "index": 19, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 134.8, "r_y0": 226.4, "r_x1": 145.7, "r_y1": 226.4, "r_x2": 145.7, "r_y2": 218.3, "r_x3": 134.8, "r_y3": 218.3, "coord_origin": "TOPLEFT" }, "text": "21.", "orig": "21.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 20, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 150.0, "r_y0": 226.4, "r_x1": 480.6, "r_y1": 226.4, "r_x2": 480.6, "r_y2": 218.3, "r_x3": 150.0, "r_y3": 218.3, "coord_origin": "TOPLEFT" }, "text": "Zheng, X., Burdick, D., Popa, L., Zhong, X., Wang, N.X.R.: Global table extractor", "orig": "Zheng, X., Burdick, D., Popa, L., Zhong, X., Wang, N.X.R.: Global table extractor", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 21, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 151.5, "r_y0": 237.3, "r_x1": 480.6, "r_y1": 237.3, "r_x2": 480.6, "r_y2": 229.3, "r_x3": 151.5, "r_y3": 229.3, "coord_origin": "TOPLEFT" }, "text": "(gte): A framework for joint table identification and cell structure recognition using", "orig": "(gte): A framework for joint table identification and cell structure recognition using", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 22, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 151.5, "r_y0": 248.3, "r_x1": 480.6, "r_y1": 248.3, "r_x2": 480.6, "r_y2": 240.2, "r_x3": 151.5, "r_y3": 240.2, "coord_origin": "TOPLEFT" }, "text": "visual context. In: 2021 IEEE Winter Conference on Applications of Computer Vi-", "orig": "visual context. In: 2021 IEEE Winter Conference on Applications of Computer Vi-", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 23, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 151.5, "r_y0": 259.3, "r_x1": 293.4, "r_y1": 259.3, "r_x2": 293.4, "r_y2": 251.2, "r_x3": 151.5, "r_y3": 251.2, "coord_origin": "TOPLEFT" }, "text": "sion (WACV). pp. 697-706 (2021).", "orig": "sion (WACV). pp. 697-706 (2021).", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 24, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 297.0, "r_y0": 259.3, "r_x1": 480.6, "r_y1": 259.3, "r_x2": 480.6, "r_y2": 251.8, "r_x3": 297.0, "r_y3": 251.8, "coord_origin": "TOPLEFT" }, "text": "https://doi.org/10.1109/WACV48630.2021.", "orig": "https://doi.org/10.1109/WACV48630.2021.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 25, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 151.5, "r_y0": 270.3, "r_x1": 175.1, "r_y1": 270.3, "r_x2": 175.1, "r_y2": 262.8, "r_x3": 151.5, "r_y3": 262.8, "coord_origin": "TOPLEFT" }, "text": "00074", "orig": "00074", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, "text": "21. Zheng, X., Burdick, D., Popa, L., Zhong, X., Wang, N.X.R.: Global table extractor (gte): A framework for joint table identification and cell structure recognition using visual context. In: 2021 IEEE Winter Conference on Applications of Computer Vision (WACV). pp. 697-706 (2021). https://doi.org/10.1109/WACV48630.2021. 00074" }, { "label": "list_item", "id": 1, "page_no": 13, "cluster": { "id": 1, "label": "list_item", "bbox": { "l": 134.8, "t": 273.1, "r": 480.6, "b": 314.0, "coord_origin": "TOPLEFT" }, "confidence": 0.97, "cells": [ { "index": 26, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 134.8, "r_y0": 281.2, "r_x1": 146.4, "r_y1": 281.2, "r_x2": 146.4, "r_y2": 273.1, "r_x3": 134.8, "r_y3": 273.1, "coord_origin": "TOPLEFT" }, "text": "22.", "orig": "22.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 27, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 150.9, "r_y0": 281.2, "r_x1": 480.6, "r_y1": 281.2, "r_x2": 480.6, "r_y2": 273.1, "r_x3": 150.9, "r_y3": 273.1, "coord_origin": "TOPLEFT" }, "text": "Zhong, X., ShafieiBavani, E., Jimeno Yepes, A.: Image-based table recognition:", "orig": "Zhong, X., ShafieiBavani, E., Jimeno Yepes, A.: Image-based table recognition:", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 28, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 151.5, "r_y0": 292.1, "r_x1": 480.6, "r_y1": 292.1, "r_x2": 480.6, "r_y2": 284.1, "r_x3": 151.5, "r_y3": 284.1, "coord_origin": "TOPLEFT" }, "text": "Data, model, and evaluation. In: Vedaldi, A., Bischof, H., Brox, T., Frahm, J.M.", "orig": "Data, model, and evaluation. In: Vedaldi, A., Bischof, H., Brox, T., Frahm, J.M.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 29, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 151.5, "r_y0": 303.1, "r_x1": 480.6, "r_y1": 303.1, "r_x2": 480.6, "r_y2": 295.0, "r_x3": 151.5, "r_y3": 295.0, "coord_origin": "TOPLEFT" }, "text": "(eds.) Computer Vision - ECCV 2020. pp. 564-580. Springer International Pub-", "orig": "(eds.) Computer Vision - ECCV 2020. pp. 564-580. Springer International Pub-", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 30, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 151.5, "r_y0": 314.0, "r_x1": 236.0, "r_y1": 314.0, "r_x2": 236.0, "r_y2": 306.0, "r_x3": 151.5, "r_y3": 306.0, "coord_origin": "TOPLEFT" }, "text": "lishing, Cham (2020)", "orig": "lishing, Cham (2020)", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, "text": "22. Zhong, X., ShafieiBavani, E., Jimeno Yepes, A.: Image-based table recognition: Data, model, and evaluation. In: Vedaldi, A., Bischof, H., Brox, T., Frahm, J.M. (eds.) Computer Vision - ECCV 2020. pp. 564-580. Springer International Publishing, Cham (2020)" }, { "label": "list_item", "id": 2, "page_no": 13, "cluster": { "id": 2, "label": "list_item", "bbox": { "l": 134.8, "t": 316.9, "r": 480.6, "b": 346.9, "coord_origin": "TOPLEFT" }, "confidence": 0.97, "cells": [ { "index": 31, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 134.8, "r_y0": 325.0, "r_x1": 145.7, "r_y1": 325.0, "r_x2": 145.7, "r_y2": 316.9, "r_x3": 134.8, "r_y3": 316.9, "coord_origin": "TOPLEFT" }, "text": "23.", "orig": "23.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 32, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 150.0, "r_y0": 325.0, "r_x1": 480.6, "r_y1": 325.0, "r_x2": 480.6, "r_y2": 316.9, "r_x3": 150.0, "r_y3": 316.9, "coord_origin": "TOPLEFT" }, "text": "Zhong, X., Tang, J., Yepes, A.J.: Publaynet: largest dataset ever for document lay-", "orig": "Zhong, X., Tang, J., Yepes, A.J.: Publaynet: largest dataset ever for document lay-", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 33, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 151.5, "r_y0": 336.0, "r_x1": 480.6, "r_y1": 336.0, "r_x2": 480.6, "r_y2": 327.9, "r_x3": 151.5, "r_y3": 327.9, "coord_origin": "TOPLEFT" }, "text": "out analysis. In: 2019 International Conference on Document Analysis and Recog-", "orig": "out analysis. In: 2019 International Conference on Document Analysis and Recog-", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 34, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 151.5, "r_y0": 346.9, "r_x1": 335.1, "r_y1": 346.9, "r_x2": 335.1, "r_y2": 338.9, "r_x3": 151.5, "r_y3": 338.9, "coord_origin": "TOPLEFT" }, "text": "nition (ICDAR). pp. 1015-1022. IEEE (2019)", "orig": "nition (ICDAR). pp. 1015-1022. IEEE (2019)", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, "text": "23. Zhong, X., Tang, J., Yepes, A.J.: Publaynet: largest dataset ever for document layout analysis. In: 2019 International Conference on Document Analysis and Recognition (ICDAR). pp. 1015-1022. IEEE (2019)" } ], "body": [ { "label": "list_item", "id": 5, "page_no": 13, "cluster": { "id": 5, "label": "list_item", "bbox": { "l": 134.8, "t": 119.7, "r": 480.6, "b": 149.7, "coord_origin": "TOPLEFT" }, "confidence": 0.94, "cells": [ { "index": 3, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 134.8, "r_y0": 127.7, "r_x1": 146.1, "r_y1": 127.7, "r_x2": 146.1, "r_y2": 119.7, "r_x3": 134.8, "r_y3": 119.7, "coord_origin": "TOPLEFT" }, "text": "18.", "orig": "18.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 4, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 150.5, "r_y0": 127.7, "r_x1": 480.6, "r_y1": 127.7, "r_x2": 480.6, "r_y2": 119.7, "r_x3": 150.5, "r_y3": 119.7, "coord_origin": "TOPLEFT" }, "text": "Xue, W., Yu, B., Wang, W., Tao, D., Li, Q.: Tgrnet: A table graph reconstruc-", "orig": "Xue, W., Yu, B., Wang, W., Tao, D., Li, Q.: Tgrnet: A table graph reconstruc-", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 5, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 151.5, "r_y0": 138.7, "r_x1": 480.6, "r_y1": 138.7, "r_x2": 480.6, "r_y2": 130.6, "r_x3": 151.5, "r_y3": 130.6, "coord_origin": "TOPLEFT" }, "text": "tion network for table structure recognition. In: Proceedings of the IEEE/CVF", "orig": "tion network for table structure recognition. In: Proceedings of the IEEE/CVF", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 6, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 151.5, "r_y0": 149.7, "r_x1": 427.5, "r_y1": 149.7, "r_x2": 427.5, "r_y2": 141.6, "r_x3": 151.5, "r_y3": 141.6, "coord_origin": "TOPLEFT" }, "text": "International Conference on Computer Vision. pp. 1295-1304 (2021)", "orig": "International Conference on Computer Vision. pp. 1295-1304 (2021)", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, "text": "18. Xue, W., Yu, B., Wang, W., Tao, D., Li, Q.: Tgrnet: A table graph reconstruction network for table structure recognition. In: Proceedings of the IEEE/CVF International Conference on Computer Vision. pp. 1295-1304 (2021)" }, { "label": "list_item", "id": 3, "page_no": 13, "cluster": { "id": 3, "label": "list_item", "bbox": { "l": 134.8, "t": 152.6, "r": 480.6, "b": 193.5, "coord_origin": "TOPLEFT" }, "confidence": 0.95, "cells": [ { "index": 7, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 134.8, "r_y0": 160.6, "r_x1": 146.2, "r_y1": 160.6, "r_x2": 146.2, "r_y2": 152.6, "r_x3": 134.8, "r_y3": 152.6, "coord_origin": "TOPLEFT" }, "text": "19.", "orig": "19.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 8, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 150.7, "r_y0": 160.6, "r_x1": 480.6, "r_y1": 160.6, "r_x2": 480.6, "r_y2": 152.6, "r_x3": 150.7, "r_y3": 152.6, "coord_origin": "TOPLEFT" }, "text": "Ye, J., Qi, X., He, Y., Chen, Y., Gu, D., Gao, P., Xiao, R.: Pingan-vcgroup\u2019s", "orig": "Ye, J., Qi, X., He, Y., Chen, Y., Gu, D., Gao, P., Xiao, R.: Pingan-vcgroup\u2019s", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 9, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 151.5, "r_y0": 171.6, "r_x1": 480.6, "r_y1": 171.6, "r_x2": 480.6, "r_y2": 163.5, "r_x3": 151.5, "r_y3": 163.5, "coord_origin": "TOPLEFT" }, "text": "solution for icdar 2021 competition on scientific literature parsing task b: Ta-", "orig": "solution for icdar 2021 competition on scientific literature parsing task b: Ta-", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 10, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 151.5, "r_y0": 182.5, "r_x1": 280.6, "r_y1": 182.5, "r_x2": 280.6, "r_y2": 174.5, "r_x3": 151.5, "r_y3": 174.5, "coord_origin": "TOPLEFT" }, "text": "ble recognition to html (2021).", "orig": "ble recognition to html (2021).", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 11, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 285.1, "r_y0": 182.6, "r_x1": 478.0, "r_y1": 182.6, "r_x2": 478.0, "r_y2": 175.1, "r_x3": 285.1, "r_y3": 175.1, "coord_origin": "TOPLEFT" }, "text": "https://doi.org/10.48550/ARXIV.2105.01848", "orig": "https://doi.org/10.48550/ARXIV.2105.01848", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 12, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 478.0, "r_y0": 182.5, "r_x1": 480.6, "r_y1": 182.5, "r_x2": 480.6, "r_y2": 174.5, "r_x3": 478.0, "r_y3": 174.5, "coord_origin": "TOPLEFT" }, "text": ",", "orig": ",", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 13, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 151.5, "r_y0": 193.5, "r_x1": 302.1, "r_y1": 193.5, "r_x2": 302.1, "r_y2": 186.1, "r_x3": 151.5, "r_y3": 186.1, "coord_origin": "TOPLEFT" }, "text": "https://arxiv.org/abs/2105.01848", "orig": "https://arxiv.org/abs/2105.01848", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, "text": "19. Ye, J., Qi, X., He, Y., Chen, Y., Gu, D., Gao, P., Xiao, R.: Pingan-vcgroup's solution for icdar 2021 competition on scientific literature parsing task b: Table recognition to html (2021). https://doi.org/10.48550/ARXIV.2105.01848 , https://arxiv.org/abs/2105.01848" }, { "label": "list_item", "id": 4, "page_no": 13, "cluster": { "id": 4, "label": "list_item", "bbox": { "l": 134.8, "t": 196.4, "r": 480.6, "b": 215.4, "coord_origin": "TOPLEFT" }, "confidence": 0.95, "cells": [ { "index": 14, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 134.8, "r_y0": 204.5, "r_x1": 145.7, "r_y1": 204.5, "r_x2": 145.7, "r_y2": 196.4, "r_x3": 134.8, "r_y3": 196.4, "coord_origin": "TOPLEFT" }, "text": "20.", "orig": "20.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 15, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 149.9, "r_y0": 204.5, "r_x1": 480.6, "r_y1": 204.5, "r_x2": 480.6, "r_y2": 196.4, "r_x3": 149.9, "r_y3": 196.4, "coord_origin": "TOPLEFT" }, "text": "Zhang, Z., Zhang, J., Du, J., Wang, F.: Split, embed and merge: An accurate table", "orig": "Zhang, Z., Zhang, J., Du, J., Wang, F.: Split, embed and merge: An accurate table", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 16, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 151.5, "r_y0": 215.4, "r_x1": 318.6, "r_y1": 215.4, "r_x2": 318.6, "r_y2": 207.3, "r_x3": 151.5, "r_y3": 207.3, "coord_origin": "TOPLEFT" }, "text": "structure recognizer. Pattern Recognition", "orig": "structure recognizer. Pattern Recognition", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 17, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 321.6, "r_y0": 215.2, "r_x1": 337.5, "r_y1": 215.2, "r_x2": 337.5, "r_y2": 207.3, "r_x3": 321.6, "r_y3": 207.3, "coord_origin": "TOPLEFT" }, "text": "126", "orig": "126", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 18, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 337.5, "r_y0": 215.4, "r_x1": 399.5, "r_y1": 215.4, "r_x2": 399.5, "r_y2": 207.3, "r_x3": 337.5, "r_y3": 207.3, "coord_origin": "TOPLEFT" }, "text": ", 108565 (2022)", "orig": ", 108565 (2022)", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, "text": "20. Zhang, Z., Zhang, J., Du, J., Wang, F.: Split, embed and merge: An accurate table structure recognizer. Pattern Recognition 126 , 108565 (2022)" }, { "label": "list_item", "id": 0, "page_no": 13, "cluster": { "id": 0, "label": "list_item", "bbox": { "l": 134.8, "t": 218.3, "r": 480.6, "b": 270.3, "coord_origin": "TOPLEFT" }, "confidence": 0.97, "cells": [ { "index": 19, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 134.8, "r_y0": 226.4, "r_x1": 145.7, "r_y1": 226.4, "r_x2": 145.7, "r_y2": 218.3, "r_x3": 134.8, "r_y3": 218.3, "coord_origin": "TOPLEFT" }, "text": "21.", "orig": "21.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 20, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 150.0, "r_y0": 226.4, "r_x1": 480.6, "r_y1": 226.4, "r_x2": 480.6, "r_y2": 218.3, "r_x3": 150.0, "r_y3": 218.3, "coord_origin": "TOPLEFT" }, "text": "Zheng, X., Burdick, D., Popa, L., Zhong, X., Wang, N.X.R.: Global table extractor", "orig": "Zheng, X., Burdick, D., Popa, L., Zhong, X., Wang, N.X.R.: Global table extractor", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 21, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 151.5, "r_y0": 237.3, "r_x1": 480.6, "r_y1": 237.3, "r_x2": 480.6, "r_y2": 229.3, "r_x3": 151.5, "r_y3": 229.3, "coord_origin": "TOPLEFT" }, "text": "(gte): A framework for joint table identification and cell structure recognition using", "orig": "(gte): A framework for joint table identification and cell structure recognition using", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 22, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 151.5, "r_y0": 248.3, "r_x1": 480.6, "r_y1": 248.3, "r_x2": 480.6, "r_y2": 240.2, "r_x3": 151.5, "r_y3": 240.2, "coord_origin": "TOPLEFT" }, "text": "visual context. In: 2021 IEEE Winter Conference on Applications of Computer Vi-", "orig": "visual context. In: 2021 IEEE Winter Conference on Applications of Computer Vi-", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 23, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 151.5, "r_y0": 259.3, "r_x1": 293.4, "r_y1": 259.3, "r_x2": 293.4, "r_y2": 251.2, "r_x3": 151.5, "r_y3": 251.2, "coord_origin": "TOPLEFT" }, "text": "sion (WACV). pp. 697-706 (2021).", "orig": "sion (WACV). pp. 697-706 (2021).", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 24, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 297.0, "r_y0": 259.3, "r_x1": 480.6, "r_y1": 259.3, "r_x2": 480.6, "r_y2": 251.8, "r_x3": 297.0, "r_y3": 251.8, "coord_origin": "TOPLEFT" }, "text": "https://doi.org/10.1109/WACV48630.2021.", "orig": "https://doi.org/10.1109/WACV48630.2021.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 25, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 151.5, "r_y0": 270.3, "r_x1": 175.1, "r_y1": 270.3, "r_x2": 175.1, "r_y2": 262.8, "r_x3": 151.5, "r_y3": 262.8, "coord_origin": "TOPLEFT" }, "text": "00074", "orig": "00074", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, "text": "21. Zheng, X., Burdick, D., Popa, L., Zhong, X., Wang, N.X.R.: Global table extractor (gte): A framework for joint table identification and cell structure recognition using visual context. In: 2021 IEEE Winter Conference on Applications of Computer Vision (WACV). pp. 697-706 (2021). https://doi.org/10.1109/WACV48630.2021. 00074" }, { "label": "list_item", "id": 1, "page_no": 13, "cluster": { "id": 1, "label": "list_item", "bbox": { "l": 134.8, "t": 273.1, "r": 480.6, "b": 314.0, "coord_origin": "TOPLEFT" }, "confidence": 0.97, "cells": [ { "index": 26, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 134.8, "r_y0": 281.2, "r_x1": 146.4, "r_y1": 281.2, "r_x2": 146.4, "r_y2": 273.1, "r_x3": 134.8, "r_y3": 273.1, "coord_origin": "TOPLEFT" }, "text": "22.", "orig": "22.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 27, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 150.9, "r_y0": 281.2, "r_x1": 480.6, "r_y1": 281.2, "r_x2": 480.6, "r_y2": 273.1, "r_x3": 150.9, "r_y3": 273.1, "coord_origin": "TOPLEFT" }, "text": "Zhong, X., ShafieiBavani, E., Jimeno Yepes, A.: Image-based table recognition:", "orig": "Zhong, X., ShafieiBavani, E., Jimeno Yepes, A.: Image-based table recognition:", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 28, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 151.5, "r_y0": 292.1, "r_x1": 480.6, "r_y1": 292.1, "r_x2": 480.6, "r_y2": 284.1, "r_x3": 151.5, "r_y3": 284.1, "coord_origin": "TOPLEFT" }, "text": "Data, model, and evaluation. In: Vedaldi, A., Bischof, H., Brox, T., Frahm, J.M.", "orig": "Data, model, and evaluation. In: Vedaldi, A., Bischof, H., Brox, T., Frahm, J.M.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 29, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 151.5, "r_y0": 303.1, "r_x1": 480.6, "r_y1": 303.1, "r_x2": 480.6, "r_y2": 295.0, "r_x3": 151.5, "r_y3": 295.0, "coord_origin": "TOPLEFT" }, "text": "(eds.) Computer Vision - ECCV 2020. pp. 564-580. Springer International Pub-", "orig": "(eds.) Computer Vision - ECCV 2020. pp. 564-580. Springer International Pub-", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 30, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 151.5, "r_y0": 314.0, "r_x1": 236.0, "r_y1": 314.0, "r_x2": 236.0, "r_y2": 306.0, "r_x3": 151.5, "r_y3": 306.0, "coord_origin": "TOPLEFT" }, "text": "lishing, Cham (2020)", "orig": "lishing, Cham (2020)", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, "text": "22. Zhong, X., ShafieiBavani, E., Jimeno Yepes, A.: Image-based table recognition: Data, model, and evaluation. In: Vedaldi, A., Bischof, H., Brox, T., Frahm, J.M. (eds.) Computer Vision - ECCV 2020. pp. 564-580. Springer International Publishing, Cham (2020)" }, { "label": "list_item", "id": 2, "page_no": 13, "cluster": { "id": 2, "label": "list_item", "bbox": { "l": 134.8, "t": 316.9, "r": 480.6, "b": 346.9, "coord_origin": "TOPLEFT" }, "confidence": 0.97, "cells": [ { "index": 31, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 134.8, "r_y0": 325.0, "r_x1": 145.7, "r_y1": 325.0, "r_x2": 145.7, "r_y2": 316.9, "r_x3": 134.8, "r_y3": 316.9, "coord_origin": "TOPLEFT" }, "text": "23.", "orig": "23.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 32, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 150.0, "r_y0": 325.0, "r_x1": 480.6, "r_y1": 325.0, "r_x2": 480.6, "r_y2": 316.9, "r_x3": 150.0, "r_y3": 316.9, "coord_origin": "TOPLEFT" }, "text": "Zhong, X., Tang, J., Yepes, A.J.: Publaynet: largest dataset ever for document lay-", "orig": "Zhong, X., Tang, J., Yepes, A.J.: Publaynet: largest dataset ever for document lay-", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 33, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 151.5, "r_y0": 336.0, "r_x1": 480.6, "r_y1": 336.0, "r_x2": 480.6, "r_y2": 327.9, "r_x3": 151.5, "r_y3": 327.9, "coord_origin": "TOPLEFT" }, "text": "out analysis. In: 2019 International Conference on Document Analysis and Recog-", "orig": "out analysis. In: 2019 International Conference on Document Analysis and Recog-", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 34, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 151.5, "r_y0": 346.9, "r_x1": 335.1, "r_y1": 346.9, "r_x2": 335.1, "r_y2": 338.9, "r_x3": 151.5, "r_y3": 338.9, "coord_origin": "TOPLEFT" }, "text": "nition (ICDAR). pp. 1015-1022. IEEE (2019)", "orig": "nition (ICDAR). pp. 1015-1022. IEEE (2019)", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, "text": "23. Zhong, X., Tang, J., Yepes, A.J.: Publaynet: largest dataset ever for document layout analysis. In: 2019 International Conference on Document Analysis and Recognition (ICDAR). pp. 1015-1022. IEEE (2019)" } ], "headers": [ { "label": "page_header", "id": 7, "page_no": 13, "cluster": { "id": 7, "label": "page_header", "bbox": { "l": 134.8, "t": 93.8, "r": 144.0, "b": 101.8, "coord_origin": "TOPLEFT" }, "confidence": 0.7, "cells": [ { "index": 0, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 134.8, "r_y0": 101.8, "r_x1": 144.0, "r_y1": 101.8, "r_x2": 144.0, "r_y2": 93.8, "r_x3": 134.8, "r_y3": 93.8, "coord_origin": "TOPLEFT" }, "text": "14", "orig": "14", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, "text": "14" }, { "label": "page_header", "id": 6, "page_no": 13, "cluster": { "id": 6, "label": "page_header", "bbox": { "l": 167.8, "t": 93.8, "r": 231.7, "b": 101.8, "coord_origin": "TOPLEFT" }, "confidence": 0.79, "cells": [ { "index": 1, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 167.8, "r_y0": 101.8, "r_x1": 178.1, "r_y1": 101.8, "r_x2": 178.1, "r_y2": 93.8, "r_x3": 167.8, "r_y3": 93.8, "coord_origin": "TOPLEFT" }, "text": "M.", "orig": "M.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 2, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 182.4, "r_y0": 101.8, "r_x1": 231.7, "r_y1": 101.8, "r_x2": 231.7, "r_y2": 93.8, "r_x3": 182.4, "r_y3": 93.8, "coord_origin": "TOPLEFT" }, "text": "Lysak, et al.", "orig": "Lysak, et al.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, "text": "M. Lysak, et al." } ] } } ]